<?xml version='1.0'?>
<!DOCTYPE art SYSTEM 'http://www.biomedcentral.com/xml/article.dtd'>
<art>
   <ui>gb-2008-9-6-r94</ui>
   <ji>GBJ</ji>
   <fm>
      <dochead>Research</dochead>
      <bibl>
         <title>
            <p>Ch&#230;tognath transcriptome reveals ancestral and unique features among bilaterians</p>
         </title>
         <aug>
            <au id="A1">
               <snm>Marl&#233;taz</snm>
               <fnm>Ferdinand</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <email>ferdinand.marletaz@univmed.fr</email>
            </au>
            <au id="A2">
               <snm>Gilles</snm>
               <fnm>Andr&#233;</fnm>
               <insr iid="I3"/>
               <insr iid="I4"/>
               <email>andre.gilles@univ-provence.fr</email>
            </au>
            <au id="A3">
               <snm>Caubit</snm>
               <fnm>Xavier</fnm>
               <insr iid="I2"/>
               <insr iid="I5"/>
               <email>caubit@ibdm.univ-mrs.fr</email>
            </au>
            <au id="A4">
               <snm>Perez</snm>
               <fnm>Yvan</fnm>
               <insr iid="I3"/>
               <insr iid="I4"/>
               <email>perezyvan@hotmail.com</email>
            </au>
            <au id="A5">
               <snm>Dossat</snm>
               <fnm>Carole</fnm>
               <insr iid="I6"/>
               <insr iid="I7"/>
               <insr iid="I8"/>
               <email>cdossat@genoscope.cns.fr</email>
            </au>
            <au id="A6">
               <snm>Samain</snm>
               <fnm>Sylvie</fnm>
               <insr iid="I6"/>
               <insr iid="I7"/>
               <insr iid="I8"/>
               <email>samain@genoscope.cns.fr</email>
            </au>
            <au id="A7">
               <snm>Gyapay</snm>
               <fnm>Gabor</fnm>
               <insr iid="I6"/>
               <insr iid="I7"/>
               <insr iid="I8"/>
               <email>gabor@genoscope.cns.fr</email>
            </au>
            <au id="A8">
               <snm>Wincker</snm>
               <fnm>Patrick</fnm>
               <insr iid="I6"/>
               <insr iid="I7"/>
               <insr iid="I8"/>
               <email>wincker@genoscope.cns.fr</email>
            </au>
            <au id="A9" ca="yes">
               <snm>Le Parco</snm>
               <fnm>Yannick</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <email>yannick.leparco@univmed.fr</email>
            </au>
         </aug>
         <insg>
            <ins id="I1">
               <p>CNRS UMR 6540 DIMAR, Station Marine d'Endoume, Centre d'Oc&#233;anologie de Marseille, Chemin de la Batterie des Lions, 13007, Marseille, France</p>
            </ins>
            <ins id="I2">
               <p>Universit&#233; de la M&#233;diterran&#233;e Aix-Marseille II, Bd Charles Livon, 13284, Marseille, France</p>
            </ins>
            <ins id="I3">
               <p>Universit&#233; de Provence Aix-Marseille I, place Victor-Hugo, 13331, Marseille, France</p>
            </ins>
            <ins id="I4">
               <p>CNRS UMR 6116 IMEP, Centre St Charles, place Victor-Hugo, 13331, Marseille, France</p>
            </ins>
            <ins id="I5">
               <p>CNRS UMR 6216, IBDML, Campus de Luminy, Route L&#233;on Lachamp, 13288, Marseille, France</p>
            </ins>
            <ins id="I6">
               <p>Genoscope (CEA), rue Gaston Cr&#233;mieux, BP5706, 91057 Evry, France</p>
            </ins>
            <ins id="I7">
               <p>CNRS, UMR 8030, rue Gaston Cr&#233;mieux, BP5706, 91057 Evry, France</p>
            </ins>
            <ins id="I8">
               <p>Universit&#233; d'Evry, Boulevard Fran&#231;ois Mitterrand, 91025, Evry, France</p>
            </ins>
         </insg>
         <source>Genome Biology</source>
         <issn>1465-6906</issn>
         <pubdate>2008</pubdate>
         <volume>9</volume>
         <issue>6</issue>
         <fpage>R94</fpage>
         <url>http://genomebiology.com/2008/9/6/R94</url>
         <xrefbib>
            <pubidlist>
               <pubid idtype="pmpid">18533022</pubid>
               <pubid idtype="doi">10.1186/gb-2008-9-6-r94</pubid>
            </pubidlist>
         </xrefbib>
      </bibl>
      <history>
         <rec>
            <date>
               <day>5</day>
               <month>11</month>
               <year>2007</year>
            </date>
         </rec>
         <revrec>
            <date>
               <day>3</day>
               <month>3</month>
               <year>2008</year>
            </date>
         </revrec>
         <acc>
            <date>
               <day>4</day>
               <month>6</month>
               <year>2008</year>
            </date>
         </acc>
         <pub>
            <date>
               <day>04</day>
               <month>06</month>
               <year>2008</year>
            </date>
         </pub>
      </history>
      <cpyrt>
         <year>2008</year>
         <collab>Marl&#233;taz et al.; licensee BioMed Central Ltd.</collab>
         <note>This is an open access article distributed under the terms of the Creative Commons Attribution License (<url>http://creativecommons.org/licenses/by/2.0</url>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</note>
      </cpyrt>
      <shorttitle>
         <p>Ch&#230;tognath genomics and evolution</p>
      </shorttitle>
      <shortabs>
         <p>The ch&#230;tognath transcriptome reveals unusual genomic features in the evolution of this protostome and suggests that it could be used as a model organism for bilaterians.</p>
      </shortabs>
      <abs>
         <sec>
            <st>
               <p>Abstract</p>
            </st>
            <sec>
               <st>
                  <p>Background</p>
               </st>
               <p>The ch&#230;tognaths (arrow worms) have puzzled zoologists for years because of their astonishing morphological and developmental characteristics. Despite their deuterostome-like development, phylogenomic studies recently positioned the ch&#230;tognath phylum in protostomes, most likely in an early branching. This key phylogenetic position and the peculiar characteristics of ch&#230;tognaths prompted further investigation of their genomic features.</p>
            </sec>
            <sec>
               <st>
                  <p>Results</p>
               </st>
               <p>Transcriptomic and genomic data were collected from the ch&#230;tognath <it>Spadella cephaloptera </it>through the sequencing of expressed sequence tags and genomic bacterial artificial chromosome clones. Transcript comparisons at various taxonomic scales emphasized the conservation of a core gene set and phylogenomic analysis confirmed the basal position of ch&#230;tognaths among protostomes. A detailed survey of transcript diversity and individual genotyping revealed a past genome duplication event in the ch&#230;tognath lineage, which was, surprisingly, followed by a high retention rate of duplicated genes. Moreover, striking genetic heterogeneity was detected within the sampled population at the nuclear and mitochondrial levels but cannot be explained by cryptic speciation. Finally, we found evidence for trans-splicing maturation of transcripts through splice-leader addition in the ch&#230;tognath phylum and we further report that this processing is associated with operonic transcription.</p>
            </sec>
            <sec>
               <st>
                  <p>Conclusion</p>
               </st>
               <p>These findings reveal both shared ancestral and unique derived characteristics of the ch&#230;tognath genome, which suggests that this genome is likely the product of a very original evolutionary history. These features promote ch&#230;tognaths as a pivotal model for comparative genomics, which could provide new clues for the investigation of the evolution of animal genomes.</p>
            </sec>
         </sec>
      </abs>
   </fm>
   <meta>
      <classifications>
         <classification type="BMC" subtype="man_spc_id" id="30010008">Evolution</classification>
         <classification type="BMC" subtype="man_spc_id" id="30010009">Genetics</classification>
         <classification type="BMC" subtype="man_spc_id" id="30010010">Genome studies</classification>
      </classifications>
   </meta>
   <bdy>
      <sec>
         <st>
            <p>Background</p>
         </st>
         <p>The recent shift of genomic biology from conventional model organisms to evolutionarily relevant species has led to the questioning of numerous ideas about metazoan evolution. For instance, the recently released genome of the starlet anemone has revealed a striking conservation with its vertebrate counterparts despite an apparent morphological gap between these organisms <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>. On the contrary, whereas the Hox gene clusters have been considered for a long time as structures strictly required for the development of the common bilaterian body plan, they were found to be disorganized or even dislocated in animals such as nematodes or urochordates <abbrgrp><abbr bid="B2">2</abbr><abbr bid="B3">3</abbr></abbrgrp>. These cases illustrate the interest of genomic insights from organisms that display either peculiar morphological characteristics or have key phylogenetic positions.</p>
         <p>Interestingly, ch&#230;tognaths, also known as arrow worms, fulfill both of these criteria: they have one of the most intriguing sets of morphological and developmental characteristics among animals and their phylogenetic position was recently reevaluated as a pivotal one for the understanding of animal evolution <abbrgrp><abbr bid="B4">4</abbr></abbrgrp>. These free-living marine creatures represent one of the major predators of the zooplancton food-chain but the phylum is mainly known for its original mosaic of morphological characteristics that have puzzled zoologists for years <abbrgrp><abbr bid="B5">5</abbr></abbrgrp>. Their nervous system exhibits typical protostome features, such as ventral nervous mid-body ganglions and circum-esophageal fibers <abbrgrp><abbr bid="B6">6</abbr></abbrgrp>, whereas the enterocoelous formation of their body cavity and the secondary emergence of their mouth are embryological features traditionally related to deuterostomes <abbrgrp><abbr bid="B7">7</abbr></abbrgrp>. Strikingly, this original body plan has been conserved since the lowermost Cambrian period as shown by convincing fossil evidence <abbrgrp><abbr bid="B8">8</abbr><abbr bid="B9">9</abbr></abbrgrp>. First attempts to position ch&#230;tognaths using molecular phylogeny were difficult because small subunits (SSUs) and large subunits (LSUs) of ribosomal RNA genes display very fast evolutionary rates that hinder accurate tree reconstruction <abbrgrp><abbr bid="B10">10</abbr><abbr bid="B11">11</abbr><abbr bid="B12">12</abbr></abbrgrp>. Subsequent analysis of their mitochondrial genome prompted classification of ch&#230;tognaths among protostomes, but their exact branching in this clade remains elusive <abbrgrp><abbr bid="B13">13</abbr><abbr bid="B14">14</abbr></abbrgrp>. The Hox genes of ch&#230;tognaths are distinct from those typical of other protostomes: their original <it>MedPost </it>gene shares similarity with both median and posterior classes <abbrgrp><abbr bid="B15">15</abbr></abbrgrp> and the posterior Hox genes that were recently identified in these animals are neither related to the AbdB nor Post1/2 classes, which are specific for ecdysozoans and lophotrochozoans, respectively <abbrgrp><abbr bid="B16">16</abbr></abbrgrp>.</p>
         <p>Recently, the phylogenomic approach has provided the opportunity to sum up the phylogenetic signal from hundreds of genes and thereby to increase the resolution of the phylogenies <abbrgrp><abbr bid="B17">17</abbr></abbrgrp>. Two different phylogenomic studies involving different ch&#230;tognath species and based on different samples of nuclear genes have assessed the phylogenetic position of ch&#230;tognaths. They have both provided strong support for the inclusion of ch&#230;tognaths within protostomes <abbrgrp><abbr bid="B17">17</abbr><abbr bid="B18">18</abbr><abbr bid="B19">19</abbr></abbrgrp>. Matus <it>et al. </it><abbrgrp><abbr bid="B19">19</abbr></abbrgrp> suggested the branching of ch&#230;tognaths at the base of lophotrochozoans on the basis of 72 nuclear genes described as valuable phylogenetic markers by Philippe <it>et al</it>. <abbrgrp><abbr bid="B20">20</abbr></abbrgrp>. Conversely, using a slightly larger taxonomic sampling and 78 ribosomal protein (RP) genes, Marl&#233;taz <it>et al. </it><abbrgrp><abbr bid="B18">18</abbr></abbrgrp> proposed that ch&#230;tognaths are the sister group of all other protostomes. This last hypothesis has deep implications for the evolution of developmental patterns among bilaterians since it promotes the view that deuterostome-like developmental features such as enterocoely or a secondary mouth opening may be ancestral among bilaterians. Interestingly, recent insights into the structure of the nervous system of ch&#230;tognaths suggest that these organisms have an intra-epidermal non-centralized nerve plexus, such as those observed in hemichordates or cnidarians <abbrgrp><abbr bid="B6">6</abbr></abbrgrp>. This is another example of a putative ancestral characteristic in this phylum. Then, both the phylogenetic position of ch&#230;tognaths and their peculiar morphology and development indicate that these organisms are pivotal for the understanding of animal evolution.</p>
         <p>The expressed sequence tag (EST) approach provides an interesting opportunity to survey genomes and to perform comparisons between organisms. For instance, whole transcriptome comparisons based on ESTs initially suggested that the gene repertory shared by all metazoans is larger than expected <abbrgrp><abbr bid="B21">21</abbr></abbrgrp>. Moreover, in regard to the unexpected genetic complexity of cnidarians, the evolutionary extent of gene losses observed in nematodes and <it>Drosophila </it>remains to be defined <abbrgrp><abbr bid="B21">21</abbr></abbrgrp>. Through their original phylogenetic position, ch&#230;tognaths offer the opportunity to check whether the ancestral protostome transcriptome has already undergone such gene losses or remains close to the ancestral bilaterian gene set conserved between vertebrates and cnidarians. Furthermore, the identification of a core set of metazoan conserved genes from a large range of organisms provides marker genes for phylogenomic analyses and signature genes as rare genomic changes, which could lead to a reevaluation of animal phylogeny <abbrgrp><abbr bid="B22">22</abbr><abbr bid="B23">23</abbr></abbrgrp>.</p>
         <p>Here, we describe an overview of <it>Spadella cephaloptera </it>genomics through fine-scale mining of consistent transcriptomic data. Although the morphology of ch&#230;tognaths has been extensively described, only a few molecular studies have focused on these strange organisms. The transcriptome of ch&#230;tognaths reveals a strong similarity with that of other bilaterians. This comparative framework allowed detection of molecular signatures and stressed the usefulness of RPs as marker genes for phylogenomic reconstruction. Along with the structural RNAs, RPs are major components of the ribosome translation complex <abbrgrp><abbr bid="B24">24</abbr></abbrgrp>. They constitute a set of remarkably conserved genes among eukaryotes, which have not been significantly affected by lineage-specific duplication <abbrgrp><abbr bid="B25">25</abbr></abbrgrp>. We took advantage of their high levels of expression, which allowed the assembly of a large dataset with extensive taxon sampling using ESTs. We then investigated the origin of the polymorphisms observed within the EST collection in the light of genome duplication or cryptic speciation as alternative explanatory hypotheses. Lastly, we found evidence for trans-splicing mRNA maturation in ch&#230;tognaths from this EST data. This original mRNA processing mechanism involves the addition of a spliced-leader sequence at the 5' extremity of transcripts. This mechanism has been discovered in several animal phyla by analyzing other EST collections <abbrgrp><abbr bid="B26">26</abbr></abbrgrp>. Interestingly, the occurrence of trans-splicing in ch&#230;tognaths has deep implications for the evolutionary origin and functional significance of this mechanism.</p>
      </sec>
      <sec>
         <st>
            <p>Results and discussion</p>
         </st>
         <sec>
            <st>
               <p>Partial transcriptome of the ch&#230;tognath <it>S. cephaloptera</it></p>
            </st>
            <p>The sequencing of an EST collection of the juvenile-staged ch&#230;tognath <it>S. cephaloptera </it>offered the opportunity to explore the transcriptome of this evolutionarily significant organism. The survey of sequence length and quality supported the accuracy of these data (Figure S1 in Additional data file 1). During these steps, we noticed that 16% of sequences match mitochondrial rRNA sequences (12S and 16S rRNAs, Figure <figr fid="F1">1</figr>) probably because the long polyadenine stretches of these rRNA molecules were isolated by the oligos-dT employed for mRNA isolation (see Materials and methods). We attempted to build clusters that gathered all transcripts from a unique gene so as to deal with a non-redundant partial transcriptome. However, the low complexity regions of some ESTs, which did not include an accurate open reading frame, hindered this process. Thus, ESTs were sorted into predicted coding and non-coding sequences using conceptual translation, and the coding transcripts were retained for comparative analyses. The overall content of the EST collection was evaluated using these steps (Figure <figr fid="F1">1</figr>). We noticed that up to 54% of the ESTs could be non-coding polyadenylated RNA, a striking figure that is, however, similar to that obtained for the human genome <abbrgrp><abbr bid="B27">27</abbr></abbrgrp>. The removal of non-coding sequences greatly improved clustering efficiency, yielding 1,447 clusters, of which 459 include more than one sequence (Figure S1 in Additional data file 1). A total of 694 of these clusters have significant matches within a protein database (TrEMBL, score >50) and 250 have clear homologs in this database with an average of 72% identity (score >150). Among the transcripts that match nuclear coding genes, the RP genes are largely represented compared to other genes similar to SwissProt entries (Figure <figr fid="F1">1</figr>).</p>
            <fig id="F1">
               <title>
                  <p>Figure 1</p>
               </title>
               <caption>
                  <p>Overall composition of the EST collection</p>
               </caption>
               <text>
                  <p>Overall composition of the EST collection. The annotation of transcripts is based on SwissProt (score >150) and led to identification of mitochondrial genes. The conceptual translation of ESTs allowed detection of those that include coding sequences. The large portion of non-coding polyadenylate nuclear transcripts and RPs among nuclear transcripts is the most prominent aspect of this distribution as well as the unexpected presence of mitochondrial rRNAs (12 and 16S) related to their polyadenine stretches.</p>
               </text>
               <graphic file="gb-2008-9-6-r94-1"/>
            </fig>
            <p>The average gene content of the library was checked regarding functional annotation as implemented in Gene Ontology <abbrgrp><abbr bid="B28">28</abbr></abbrgrp>. The <it>S. cephaloptera </it>library exhibited a broad diversity of functional classes with a majority of transcripts involved in metabolism or cellular activities and a non-negligible amount of transcripts involved in development (Figure S2 in Additional data file 1), which is consistent with the juvenile stage of the animals used. Hence, this EST collection contains representative, high quality sequences, providing suitable material for comparative analyses.</p>
         </sec>
         <sec>
            <st>
               <p>Gene core conservation</p>
            </st>
            <p>The set of non-redundant ch&#230;tognath transcripts was compared with several databases using the Blast program. These databases first included sets of transcripts of representative species belonging to the most important clades of bilaterians: <it>Drosophila melanogaster </it>as an ecdysozoan, <it>Lumbricus terrestris </it>as a lophotrochozoan and <it>Homo sapiens </it>as a deuterostome. These comparisons were depicted through the plotting of respective similarity scores for all transcripts that have a significant match to at least one of these species (score >150, Figure <figr fid="F2">2</figr>). This comparison demonstrated that a pool of 141 transcripts is strongly conserved between these distantly related species (Figure <figr fid="F2">2a</figr>). Conversely, 169 transcripts did not have significant matches in one or two of the species despite their strong similarity between ch&#230;tognath and the remaining species. This lack of homologs is generally imputed to extensive gene loss <abbrgrp><abbr bid="B21">21</abbr></abbrgrp>. Therefore, further comparisons were performed to identify genes whose homology assignment and gene loss in a peculiar lineage were unambiguous. Interestingly, the number of transcripts that did not match to one or more databases decreased from 169 to 74 when the complete set of sequences available for each bilaterian clade was employed as the database, instead of only one representative species (Figure <figr fid="F2">2b</figr>). The lack of homologous matches in some species could then be explained by an increase in evolutionary rates, which could have weakened the sequence similarity signal <abbrgrp><abbr bid="B29">29</abbr></abbrgrp>. Additionally, the similarity level of matches increased when composite databases were employed (Figure <figr fid="F2">2</figr>), which supports the interest in this approach for phylogenomic reconstruction <abbrgrp><abbr bid="B18">18</abbr></abbrgrp>.</p>
            <fig id="F2">
               <title>
                  <p>Figure 2</p>
               </title>
               <caption>
                  <p>Visualization of relative similarity between the transcriptome of <it>S. cephaloptera </it>and <b>(a) </b>selected species or <b>(b) </b>corresponding clades: <it>H. sapiens </it>as a deuterostome, <it>D. melanogaster </it>as an ecdsyzoan and <it>L. rubellus </it>as a lophotrochozoan</p>
               </caption>
               <text>
                  <p>Visualization of relative similarity between the transcriptome of <it>S. cephaloptera </it>and <b>(a) </b>selected species or <b>(b) </b>corresponding clades: <it>H. sapiens </it>as a deuterostome, <it>D. melanogaster </it>as an ecdsyzoan and <it>L. rubellus </it>as a lophotrochozoan. The graphs are based on whole transcriptome Blast comparisons and the plotting of respective Blast scores was performed using Simitri [77] (cut-off score 150). Genes at the center of the plot are equally related to the three databases and hence represent valuable phylogenetic markers, whereas genes attracted by a node share a greater similarity with the corresponding database. Genes on the edge do not have a match in the database from the opposite vertex and those on the vertex only have a match in the corresponding database; these two types of genes constitute candidates for signature genes that have possibly been lost in a peculiar lineage. The color scale indicates the relevancy of scores.</p>
               </text>
               <graphic file="gb-2008-9-6-r94-2"/>
            </fig>
            <p>Two classes of genes provide reliable information for phylogeny inference (Figure <figr fid="F2">2b</figr>). Those that are highly shared between distantly related taxa constitute a set of conserved genes that are valuable markers for constructing phylogenomic datasets. In parallel, the genes that lack a homologous copy in one of the considered clades represent meaningful signature genes whose loss is attributable to a discrete event <abbrgrp><abbr bid="B23">23</abbr></abbrgrp>.</p>
            <p>The candidates for signature genes are the genes inferred to be lost in one of the investigated clades (Figure <figr fid="F2">2b</figr>). Those candidates were carefully examined and their presence checked in the largest sets of available ESTs and full genome sequences. These data include the newly sequenced full genomes of lophotrochozoans and is assumed to include an exhaustive gene set in these species. Numerous candidate genes were invalidated because their homology relationships are disputable or because a homolog was retrieved from the full genome sequences surveyed. Among these candidates, the guanidinoacetate N-methyltransferase (GAMT) enzyme was recovered in the ch&#230;tognath <it>S. cephaloptera</it>, in all studied deuterostomes, cnidarians and sister groups of metazoans (Figure S3 in Additional data file 1) but was not retrieved in any of the protostomes surveyed. Notably, this GAMT enzyme was also recovered in the acoel <it>Convoluta pulchra</it>, which was recently excluded from the protostomes <abbrgrp><abbr bid="B30">30</abbr></abbrgrp>. This enzyme catalyzes the key step of creatine synthesis, an activity that was previously checked biochemically in a variety of organisms but was not found in selected protostomes <abbrgrp><abbr bid="B31">31</abbr></abbrgrp>. GAMT was later noticed as missing in <it>D. melanogaster</it>, <it>Anopheles gambiae </it>and <it>Caeorhabditis elegans </it>genomes <abbrgrp><abbr bid="B32">32</abbr></abbrgrp>. The presence of this ancient gene provides strong evidence for an early divergence of ch&#230;tognaths from other protostomes. Indeed, the most parsimonious scenario states that this gene was lost in the protostome lineage after its split with ch&#230;tognaths <abbrgrp><abbr bid="B18">18</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Selection of marker genes for metazoan phylogeny</p>
            </st>
            <p>We attempted to evaluate the phylogenetic properties of the conserved genes that share equal levels of similarity with the main animal clades with respect to the convenience of their orthology assignment, their abundance in EST data and their molecular evolution properties. The main concerns when constructing phylogenomic-class datasets, especially from EST data, are the discarding of paralogous sequences, the removal of contaminants and the limitation of missing data. According to these criteria, we argue here that the set of RP genes is one of the best for setting up phylogenomic analysis in a large sample of taxa.</p>
            <p>Among the 694 ch&#230;tognath genes similar to a database entry, only 267 genes have homologs in the three main clades of bilaterians (score >150, Figure <figr fid="F2">2b</figr>). Copies of each selected marker were retrieved for all phyla studied for which EST data are available (Figure <figr fid="F3">3</figr>). In this way, the missing data were estimated through the occurrence of each gene in EST collections and preliminary phylogenetic analyses were carried out for all these independent alignments. Such controls unexpectedly highlighted putative paralogy problems for many candidate markers. If the orthologous transcript of a surveyed gene is missing in a non-exhaustive EST collection, a paralogous relative of this gene could be retrieved instead, with little chance of detection. Among candidate marker genes, RPs exhibit no ancient duplicates or out-paralogs and constitute a class of markers free from potential paralogy assignment problems <abbrgrp><abbr bid="B25">25</abbr><abbr bid="B33">33</abbr></abbrgrp>. Moreover, the gene-specific trees allowed detection of some contaminants in the EST collections, through the verification of unexpected clusterings in the tree (for example, several EST collections of parasitic organisms being contaminated by transcripts from their hosts).</p>
            <fig id="F3">
               <title>
                  <p>Figure 3</p>
               </title>
               <caption>
                  <p>RP minimization of missing data in EST-based phylogenomic datasets</p>
               </caption>
               <text>
                  <p>RP minimization of missing data in EST-based phylogenomic datasets. Dataset completeness was estimated for datasets composed of 78 RPs (red) or 115 other genes (green) retrieved from EST collections of a large range of sizes.</p>
               </text>
               <graphic file="gb-2008-9-6-r94-3"/>
            </fig>
            <p>Next, the amount of missing data was estimated using these raw alignments and compared with the number of ESTs in each available collection (Figure <figr fid="F3">3</figr>). The positive correlation observed between the number of ESTs and the completeness of the dataset is stronger when dealing with a dataset composed of RPs. For instance, the 5,235 EST collection of tardigrades yielded a dataset that is 77% complete for RPs, but only 35% complete for non-ribosomal markers. Thus, their large representation in EST collections strengthens the usefulness of RPs as phylogenetic markers.</p>
         </sec>
         <sec>
            <st>
               <p>Ch&#230;tognaths within renewed metazoan phylogeny</p>
            </st>
            <p>In order to assess the branching of ch&#230;tognaths and to stress the usefulness of RP genes for phylogenomics, a RP dataset was assembled using the composite dataset approach <abbrgrp><abbr bid="B18">18</abbr></abbrgrp>. This method depends on the selection of the least diverging copy of each marker gene in each taxon, such as a phylum, and thus allows reduction of the branch lengths of composite taxa (Table S1 in Additional data file 2). To overcome previous problems, both taxon sampling and inference methods were improved. Several new phyla were included in this analysis and, in particular, numerous protostome groups: priapulids, platyhelminthes, nermerteans, ectoprocts, entoprocts and rotifers <abbrgrp><abbr bid="B34">34</abbr><abbr bid="B35">35</abbr><abbr bid="B36">36</abbr></abbrgrp>. Most rotifer sequences were retrieved from <it>Oryza sativa </it>(rice) ESTs, where they exist as contaminants, using their very specific splice-leader sequence as an anchor (see below and <abbrgrp><abbr bid="B37">37</abbr></abbrgrp>). Rotifers constitute a key phylum with respect to ch&#230;tognaths because they were sometimes grouped together in the gnathifera clade on the basis of morphological criteria <abbrgrp><abbr bid="B38">38</abbr></abbrgrp>. Alternatively, a splitting of lophotrochozoans into two main lineages, the platyzoans (uniting platyhelminthes and rotifers) and the trochozoans (mainly annelids, molluscs, lophophorates and nermertes) has been proposed <abbrgrp><abbr bid="B39">39</abbr><abbr bid="B40">40</abbr></abbrgrp>. Otherwise, in addition to the traditional site-homogenous WAG model, we have assessed the phylogeny of bilaterians using the site-heterogeneous CAT model, which recently improved the limitation of the long-branch attraction artifact, a common pitfall in phylogenetic reconstruction <abbrgrp><abbr bid="B41">41</abbr><abbr bid="B42">42</abbr></abbrgrp>. The inclusion of the most recently released EST data for this large set of phyla led to a dataset including 11,730 amino acid positions and 25 taxa (Additional data file 4).</p>
            <p>The analysis of this dataset confirmed the branching of ch&#230;tognaths at the base of the protostomes with significant support values for both the site-homogeneous WAG model and the site-heterogeneous CAT model (bootstrap proportion (BP) of 76 and posterior probability (PP) of 1; Figure <figr fid="F4">4a,b</figr>). The inclusion of ch&#230;tognaths within protostomes is still firmly supported (BP 95, PP 1; Figure <figr fid="F4">4</figr>). The inclusion of new taxa strengthens support for both the ecdyozoa and lophotrochozoa clades but the exact relationships within these two clades remain elusive <abbrgrp><abbr bid="B35">35</abbr><abbr bid="B36">36</abbr><abbr bid="B43">43</abbr></abbrgrp>. Ch&#230;tognaths and rotifers do not exhibit any peculiar affinities, prompting us to reject the gnathifera hypothesis <abbrgrp><abbr bid="B38">38</abbr></abbrgrp>. Conversely, the branching of rotifers is problematic since this phylum is alternatively included in ecdysozoans and lophotrochozoans depending on the use of, respectively, site heterogeneous or homogeneous models (Figure <figr fid="F4">4</figr>). Thus, the clustering of platyhelminthes and rotifers in a platyzoa clade is supported by the WAG model but rejected by the CAT model, suggesting that this grouping may be somehow related to long-branch attraction (Figure <figr fid="F4">4</figr>). Alternatively, previous studies based on morphology and SSU genes have not argued for the ecdysozoan affinities of rotifers <abbrgrp><abbr bid="B38">38</abbr><abbr bid="B39">39</abbr></abbrgrp>. Surprisingly, CAT model analysis no longer succeeds in recovering the monophyly of the deuterostomes (Figure <figr fid="F4">4b</figr>). Instead, it provides limited support for the successive divergence of chordates and ambulacrarians (echinoderms and hemichordates; PP 0.9; Figure <figr fid="F4">4b</figr>). This striking topology was recovered by an independent study using the same heterogeneous CAT model <abbrgrp><abbr bid="B43">43</abbr></abbrgrp> but was neither confirmed by WAG analyses (BP 89 for the monophyly of deuterostomes; Figure <figr fid="F4">4a</figr>) nor supported on morphological bases <abbrgrp><abbr bid="B34">34</abbr><abbr bid="B38">38</abbr></abbrgrp>. One can consider that the two unexpected branchings of rotifers and deuterostomes may be related to some artifact affecting the CAT model, such as sensitivity toward compositional biases <abbrgrp><abbr bid="B44">44</abbr></abbrgrp>. Finally, the placozoan <it>Trichoplax adherens </it>surprisingly clustered within the poriferans, as a sister group of the homoscleromorphs (BP 91, PP 0.94; Figure <figr fid="F4">4</figr>), although this poriferan status has never been suggested before <abbrgrp><abbr bid="B45">45</abbr><abbr bid="B46">46</abbr></abbrgrp>. These challenging hypotheses will be investigated in further studies because they have deep implications for the evolution of metazoans (F Marl&#233;taz <it>et al</it>., in progress).</p>
            <fig id="F4">
               <title>
                  <p>Figure 4</p>
               </title>
               <caption>
                  <p>The basal-protostome branching of ch&#230;tognaths is confirmed through improved inference methods and expanded taxon sampling</p>
               </caption>
               <text>
                  <p>The basal-protostome branching of ch&#230;tognaths is confirmed through improved inference methods and expanded taxon sampling. A RP alignment of 11,730 positions (after GBlock filtration; see Additional data file 4) was analyzed using two classes of models. <b>(a) </b>Site-homogeneous model (WAG) implemented in a maximum-likelihood framework (PhyML [80] and Treefinder [81]). Similar topology and maximal posterior probabilities were obtained with Bayesian analyses using the same model (MrBayes). <b>(b) </b>Site-heterogeneous model (CAT) implemented in a bayesian framework (Phylobayes [79]). Plain colored circles denote nodes for which significant support values were obtained (likelihood ratio statistics based on expected-likelihood weights (LR-ELW) >0.95 for site-homogenous and PP >0.95 for site-heterogenous). Support values are indicated for selected nodes: LR-ELW statistics and bootstrap (bold type) for maximum likelihood (ML) using the WAG model and posterior probabilities for Bayesian inference using the CAT model.</p>
               </text>
               <graphic file="gb-2008-9-6-r94-4"/>
            </fig>
            <p>Through extended taxon sampling and improved substitution models, these analyses strongly confirm our previous statements about basal-protostome branching of ch&#230;tognaths <abbrgrp><abbr bid="B18">18</abbr></abbrgrp> and exclude the basal-lophotrochozan hypothesis <abbrgrp><abbr bid="B19">19</abbr></abbrgrp>. Although some areas of bilaterian trees are sometimes incongruent depending on models and inference methods, the position of ch&#230;tognaths remains remarkably stable throughout our analyses. Furthermore, this branching is not only supported by the presence of GAMT, an unambiguous molecular signature, but also by the posterior Hox genes of ch&#230;tognaths that are not related to the classes specific to ecdysozoans (Abd-B) or lophotrochozoans (Post1/2) <abbrgrp><abbr bid="B16">16</abbr></abbrgrp>. Finally, this topology was also recovered by independent studies involving alternative gene and taxon sampling <abbrgrp><abbr bid="B30">30</abbr><abbr bid="B35">35</abbr><abbr bid="B43">43</abbr></abbrgrp>. In a broader perspective, the strengthening of their phylogenetic position makes ch&#230;tognaths a key model for comparative genomics among bilaterians.</p>
         </sec>
         <sec>
            <st>
               <p>Genome duplication in the ch&#230;tognath phylum</p>
            </st>
            <p>The clustering of similar sequences indicated that alternative nucleotide forms are present among the transcripts encoding the same protein. Two distinct forms are observed in most cases, although three forms encode some proteins. These forms are separated by a large amount of molecular divergence and can also be distinguished by their different 5' and 3' untranslated regions (UTRs), suggesting that they correspond to different genes (Figure <figr fid="F5">5</figr> and Additional data files 5 and 6).</p>
            <fig id="F5">
               <title>
                  <p>Figure 5</p>
               </title>
               <caption>
                  <p>Alternative forms of selected markers amplified by PCR in order to assess the origin of polymorphism</p>
               </caption>
               <text>
                  <p>Alternative forms of selected markers amplified by PCR in order to assess the origin of polymorphism. <b>(a) </b>Localization of sperm within sperm receptacles (SR) and sperm ducts (SD) in the body of ch&#230;tognath <it>S. cephaloptera </it>along with ovaries (Ov) and testis (Te). The double arrow indicates that head and body of individuals were split to perform independent PCR amplifications with the purpose of detecting possible contamination from the sperm genome. <b>(b) </b>Paralogous copies of nuclear genes RP L36 and L40 with their intron positions and average lengths, which are distinct in both cases (Additional data files 5 and 6). The names and positions of primers used for the amplification are also specified (Table S3 in Additional data file 2). <b>(c) </b>Relationships between alternative copies of Cytb retrieved within the ESTs with the three different forms detected by the designed primers (Additional data file 8). Boostrap proportions are indicated for selected nodes.</p>
               </text>
               <graphic file="gb-2008-9-6-r94-5"/>
            </fig>
            <p>Ka/Ks ratios were calculated for all pairs of diverging forms to consider the impact of the nucleotide divergence on the protein sequences. The values of Ka/Ks range from 0.001-0.154 with a median value of 0.004, which confirmed the strong conservation of amino acid sequence despite the large synonymous substitutions observed in some cases (Ks values range from 0.8-75; Table S2 in Additional data file 2). These distinct forms were mainly retrieved for the most highly expressed genes, among which RP genes are prominent (Table <tblr tid="T1">1</tblr>). We verified that the observed molecular divergence could not be explained by the clustering of distant paralogous sequences. For the genes that have clear homologs among metazoans, the sequences of alternative forms always cluster together in phylogenetic analyses and are thus strongly separated from homologous genes of other animals. For instance, the RUX genes have undergone an ancient duplication resulting in the RUX-E and RUX-G paralogs in all metazoans. Interestingly, ch&#230;tognaths display up to three forms of RUX-E and two forms of RUX-G, all these forms being closely related (Figure S4 in Additional data file 1; Additional data file 7).</p>
            <tbl id="T1">
               <title>
                  <p>Table 1</p>
               </title>
               <caption>
                  <p>Occurrence of paralogous gene copies for ribosomal and non-ribosomal genes</p>
               </caption>
               <tblbdy cols="7">
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c cspan="3" ca="center">
                        <p>Ribosomal protein genes</p>
                     </c>
                     <c cspan="3" ca="center">
                        <p>Other genes</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c cspan="3">
                        <hr/>
                     </c>
                     <c cspan="3">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Inferred duplicates</p>
                     </c>
                     <c ca="center">
                        <p>Gene number</p>
                     </c>
                     <c ca="center">
                        <p>Percent selected genes</p>
                     </c>
                     <c ca="center">
                        <p>Median EST number</p>
                     </c>
                     <c ca="center">
                        <p>Gene number</p>
                     </c>
                     <c ca="center">
                        <p>Percent selected genes</p>
                     </c>
                     <c ca="center">
                        <p>Median EST number</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="7">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>17</p>
                     </c>
                     <c ca="center">
                        <p>37%</p>
                     </c>
                     <c ca="center">
                        <p>12</p>
                     </c>
                     <c ca="center">
                        <p>14</p>
                     </c>
                     <c ca="center">
                        <p>70%</p>
                     </c>
                     <c ca="center">
                        <p>16</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>28</p>
                     </c>
                     <c ca="center">
                        <p>61%</p>
                     </c>
                     <c ca="center">
                        <p>23</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>15%</p>
                     </c>
                     <c ca="center">
                        <p>6</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>2%</p>
                     </c>
                     <c ca="center">
                        <p>23</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>15%</p>
                     </c>
                     <c ca="center">
                        <p>8.5</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total</p>
                     </c>
                     <c ca="center">
                        <p>46</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>20.5</p>
                     </c>
                     <c ca="center">
                        <p>20</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>8.5</p>
                     </c>
                  </r>
               </tblbdy>
            </tbl>
            <p>Such a pattern could be explained by either the duplication of a large set of genes in the genome of ch&#230;tognaths or, alternatively, it could be explained by the presence of cryptic species within the sampled population. In the first case, the observed differences would be attributed to the divergence between paralogous genes originating through the duplication, where the genome of one individual is expected to contain the two alternative nucleotide forms. In the second case, the observed genetic differences would be caused by the genetic divergence between the orthologous genes of several cryptic species spread among the population, where one individual is thus expected to contain only one of the alternative forms.</p>
            <p>This cryptic speciation hypothesis may be supported by the strong polymorphism also observed for all genes of the mitochondrial genome, which constitutes an independent lineage from the nuclear genome. For example, cytochrome b (Cytb) transcripts but also cytochrome oxydase I and III are split into distinct forms separated by large molecular distances (Figure <figr fid="F5">5c</figr>; Figure S4 in Additional data file 1; Additional data files 8-10), thus testifying to the presence of distinct mitochondrial lineages within the sampled population.</p>
            <p>To decide between these hypotheses, we designed a PCR screen to survey the alternative forms of selected markers in independent individuals. The genes for RPs L36 and L40 were targeted because they are nuclear genes displaying two alternative forms with the highest number of transcripts in the library (Table S2 in Additional data file 2). The mitochondrial Cytb gene served as an independent reference for the interpretation of results from nuclear genes. The three distinct forms of this strongly diverging mitochondrial gene were surveyed in all the individuals tested (Figure <figr fid="F5">5c</figr>). Ch&#230;tognaths are hermaphroditic and, after fertilization, they store exogenous sperm in their sperm receptacles (Figure <figr fid="F5">5a</figr>), which makes it possible to amplify the DNA from another individual. Hence, in order to detect such contamination, we performed independent amplifications on heads, which are considered free from sperm contamination, as well as on the rest of the body, which contained sperm receptacles (Figure <figr fid="F5">5a</figr>). The experimental design made it possible to detect alternative forms through the amplification of specific DNA fragments of distinct sizes (Figure <figr fid="F5">5b</figr>; Table S3 in Additional data file 2). The PCR products were characterized by sequencing and nucleotide polymorphism was subsequently carefully examined. In addition to their nucleotide divergence in coding sequences, the distinct forms of nuclear genes for RPs L36 and L40 have alternative intron positions and lengths as well as differences in their 5' and 3' UTR regions (Figure <figr fid="F5">5b</figr>).</p>
            <p>Performed on nine individuals, the amplifications revealed the presence of the two forms of the nuclear genes for RPs L36 and L40 in each individual (Table <tblr tid="T2">2</tblr>). Conversely, only one form of the mitochondrial Cytb gene was amplified in each individual with the exception of the body of individual 1, which includes two forms, thus suggesting contamination by exogenous sperm (Table <tblr tid="T2">2</tblr>). The amplification of the divergent nucleotide forms within one individual indicates that the alternative nucleotide forms correspond to paralogous nuclear copies originating through past gene duplication events (Table <tblr tid="T1">1</tblr>). Conversely, the alternative forms of the mitochondrial gene correspond to variation within the population. Because some genes, such as that encoding Translationally controlled tumor protein (TCTP), do not present paralogous copies despite their high expression levels (112 TCTP transcripts in the EST collection; Table S2 in Additional data file 2), we addressed the extent of these duplications in evaluating the quantity of duplicated genes. If the clusters of transcripts encoding the same protein include all the transcripts from alternative paralogous genes and if those paralogous genes have similar levels of expression, the probability that transcripts from these paralogous genes are represented in a given cluster is related to the size of this cluster (see Materials and methods). Hence, all the clusters that include more than six transcripts have at least a 95% chance of including transcripts from the two copies if they exist. Such clusters of transcripts were all checked for paralogous copies through sequence alignments and trees. Paralogs were detected within 35 of the 66 clusters investigated, which suggests that up to 69% of ch&#230;tognath genes are the products of duplications. These paralogs could have arisen through either a whole genome duplication (WGD) event followed by an extensive gene loss, or several segmental duplication events.</p>
            <tbl id="T2">
               <title>
                  <p>Table 2</p>
               </title>
               <caption>
                  <p>Distinct forms recovered from PCR amplification performed on heads and bodies of ten individuals for alternative marker genes</p>
               </caption>
               <tblbdy cols="8">
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c cspan="2" ca="center">
                        <p>L36</p>
                     </c>
                     <c cspan="2" ca="center">
                        <p>L40</p>
                     </c>
                     <c cspan="3" ca="center">
                        <p>Cytb</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c cspan="2">
                        <hr/>
                     </c>
                     <c cspan="2">
                        <hr/>
                     </c>
                     <c cspan="3">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Individual</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="8">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/2</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>2/2</p>
                     </c>
                     <c ca="center">
                        <p>+/2</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>6</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/2</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>7</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>8</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>9</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c ca="center">
                        <p>+/+</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>A plus sign indicates that one copy was amplified and a numeral indicates the number of copies if more than one were amplified (size distinct alleles). The copies amplified in heads and bodies are separated by a slash (head/body).</p>
               </tblfn>
            </tbl>
            <p>The hypothesis of a WGD event is reinforced by the high occurrence of RPs among duplicated genes (Table <tblr tid="T1">1</tblr>). The trend to retain RP genes was previously observed after WGD for <it>Paramecium tetraurelia</it>, yeast and plants <abbrgrp><abbr bid="B47">47</abbr><abbr bid="B48">48</abbr><abbr bid="B49">49</abbr></abbrgrp> but is not a common occurrence in small-scale duplications. Conversely, it is difficult to understand why the paralogous genes have been retained after their duplication and maintained under purifying selection as emphasized by Ka/Ks values. This conclusion is in contradiction with the current view of gene destiny after genome duplication, which alternatively predicts that one of the gene duplicates is lost or undergoes the accumulation of substitutions <abbrgrp><abbr bid="B50">50</abbr></abbrgrp>. Using a genome-level dataset, similar findings were made about the strongly duplicated genome of <it>Paramecium </it>where the retention of duplicated genes was accounted in part by dosage compensation constraints <abbrgrp><abbr bid="B47">47</abbr></abbrgrp>.</p>
            <p>The most plausible dating is that this duplication occurred before the diversification of the major ch&#230;tognath lineages. Two copies of SSU and LSU were retrieved in members of the phylum dispersed all over the tree of ch&#230;tognaths <abbrgrp><abbr bid="B10">10</abbr><abbr bid="B11">11</abbr><abbr bid="B12">12</abbr></abbrgrp>. Moreover, the survey of 226 ESTs available for <it>Flaccisagitta enflata </it>also revealed the presence of alternative nucleotide forms for some genes (data not shown), which would confirm that the duplication is not limited to SSU/LSU genes at this taxonomic scale. Further genome data would be required to date the duplication, for instance, in considering the Ks distribution of the set of paralogs <abbrgrp><abbr bid="B51">51</abbr></abbrgrp>, and also to definitively state the nature of the duplication through the analysis of synteny in duplicated blocks of the genome. Nevertheless, this preliminary transcriptomic survey stresses the usefulness of the ch&#230;tognaths to study phylum-level genome duplication events and the destiny of paralogous genes.</p>
         </sec>
         <sec>
            <st>
               <p>Population genomics</p>
            </st>
            <p>Beyond the molecular divergence between the coding sequences of duplicated paralogous genes, a subsequent survey of the genomic sequences of selected genes revealed that the level of polymorphism is strong within each paralogous gene (Table S4 in Additional data file 2). Multiple nucleotide substitutions as well as insertion/deletion events (indels) occurred within the introns of the four selected nuclear genes (paralogous copies of the genes for both RPs L36 and L40; Additional data files 11-14). Similarly, a large number of substitutions have accumulated in the various mitochondrial genes, thus revealing distinct mitochondrial lineages within the sampled population (Figure <figr fid="F5">5c</figr>; Figure S4 in Additional data file 1). However, these strong levels of divergence remain consistent with a population genetic structure because of the regular AT composition and the limited degree of saturation revealed by Ts/Tv ratios, singleton positions being essentially transition substitutions (Table S4 in Additional data file 2; Figure S6 in Additional data file 1).</p>
            <p>We attempted to determine the origin of this population genetic heterogeneity, which could, for instance, be due to a cryptic speciation or to a past hybridization. For this, the sequences of each individual were compared using phylogenetic trees and indels as discrete informative characteristics (Figure <figr fid="F6">6</figr>). For each marker gene, individual sequences split into several major clades supported by strong bootstrap and discrete indel events, which allows unambiguous identification of heterozygous individuals (Figure <figr fid="F6">6</figr>). For example, individual 4 is heterozygous for all markers and individuals 6, 9 and 3 are heterozygous for at least one marker. Moreover, the occurrence of several cases of putative recombinations between alleles highlights the heterozygous status of some individuals (individuals 3 and 4, Figure <figr fid="F6">6b,d</figr>). Notably, our PCR-based experimental design provided positive evidence only for heterozygosis because two amplifications (head and body) were carried out per individual, yielding 0.5 probability to detect heterozygosity. Heterozygous individuals could thus be even more abundant than observed. These heterozygous cases convincingly demonstrate that a shuffling occurs between the most divergent alleles of each gene, which constitutes strong evidence for interbreeding within the sampled population. This finding definitely excludes the possibility of cryptic speciation within this <it>S. cephaloptera </it>population. Alternatively, the panmixy hypothesis was confirmed by the unimodal distribution of pairwise divergences in mismatch analysis, which is consistent with constant population size and excludes a past hybridization event (Figure S6 in Additional data file 1). Finally, the distinct mitochondrial lineages are spread within the population but they are not correlated with any haplotype differentiation at the nuclear level, which is a strong argument against the cryptic speciation hypothesis. This type of mitochondrial diversity was previously discovered for the planktonic species <it>Sagitta setosa </it>but was also interpreted with difficulty <abbrgrp><abbr bid="B52">52</abbr></abbrgrp>.</p>
            <fig id="F6">
               <title>
                  <p>Figure 6</p>
               </title>
               <caption>
                  <p>Relationships between haplotypes of nine individuals, including distinct head and body sequences for four marker genes, including two pairs of paralogous sequences: <b>(a) </b>L36 form 1; <b>(b) </b>L36 form 2; <b>(c) </b>L40 form 1; <b>(d) </b>L40 form 2</p>
               </caption>
               <text>
                  <p>Relationships between haplotypes of nine individuals, including distinct head and body sequences for four marker genes, including two pairs of paralogous sequences: <b>(a) </b>L36 form 1; <b>(b) </b>L36 form 2; <b>(c) </b>L40 form 1; <b>(d) </b>L40 form 2. The indels are plotted onto the branches (green lines). Noticeably, some individuals display mixed sequences from different haplotypes, which is explained by recombination events between alleles (purple star). The substitutions occurring between copies of the same allele in the head and body of individuals (blue branches) are assumed to be somatic mutations. These neighbor-joining trees were inferred assuming kimura 2 parameter distances from Additional data files 7-10. Boostrap proportions are indicated for selected nodes.</p>
               </text>
               <graphic file="gb-2008-9-6-r94-6"/>
            </fig>
            <p>Strikingly, these comparisons also highlighted molecular divergence between the head and the body of some individuals for each of the five markers investigated (Figure <figr fid="F6">6</figr> and Additional data file 4). Such substitutions cannot be explained by a heterozygous status of those individuals because sequences from head and body were firmly clustered in the tree (Figure <figr fid="F6">6</figr>). For example, individual 4 exhibits well-separated alleles present in both head and body but intra-individual substitution took place between head and body for both of these alleles (Figure <figr fid="F6">6c</figr>). This pattern of substitutions may be explained by the occurrence of somatic mutations during the life of individuals. This interpretation is corroborated by the large extent of intra-individual substitutions in all marker genes and all individuals. Somatic mutations are considered as rare conditions, mainly known from related disorders in humans <abbrgrp><abbr bid="B53">53</abbr></abbrgrp>. Less clear are the evolutionary implications and putative benefits of this phenomenon <abbrgrp><abbr bid="B54">54</abbr></abbrgrp>. They are sometimes suspected to play a prominent role in apoptosis and possibly in the regulation of cell division <abbrgrp><abbr bid="B54">54</abbr></abbrgrp>. Moreover, somatic mutations have been demonstrated to be more widespread in <it>Drosophila </it>than in mammals <abbrgrp><abbr bid="B55">55</abbr></abbrgrp>, and are sometimes correlated with extensive chromosome rearrangement in the <it>Drosophila </it>lineage <abbrgrp><abbr bid="B56">56</abbr></abbrgrp>. However, little is known about the extent and importance of this process in the non-model organisms. In the case of the ch&#230;tognath, somatic mutation could be due to the high mutation rates that seem to affect both germline and soma and could explain the divergence at the population and individual levels. The possible relationship of these accelerated mutation rates with structural reshaping of the genome after duplication deserves further evaluation.</p>
            <p>Notably, this level of somatic mutation generates a strong background noise that hinders the accurate interpretation of point mutations related to the diversity of haplotypes. Moreover, traditional hypotheses of population genetics are challenged by our findings: the genetic distances observed between individuals of a single population reach species-level without any evidence for cryptic speciation or past hybridization. In parallel, multiple mitochondrial lineages diverge and are spread and maintained within a single population <abbrgrp><abbr bid="B52">52</abbr></abbrgrp>. If such features are revealed as more widespread than expected, the data collected from numerous population genetic or phylogeographic studies require more cautious interpretation. This observation pleads for an increase of the sampling depth for population genetics, especially through genomic approaches <abbrgrp><abbr bid="B57">57</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Trans-splicing transcript maturation in ch&#230;tognaths</p>
            </st>
            <p>The survey of the ch&#230;tognath EST collection detected a common 36 nucleotide motif shared at their 5' end between transcripts from unrelated genes. Selected cases showed that these short motifs are absent from upstream genomic regions of the genes (Figure <figr fid="F7">7c</figr>; Additional data files 15-17). These findings strongly suggest that mRNA of <it>S. cephaloptera </it>undergoes trans-splicing maturation. This mRNA processing occurs through the spliceosomal transfer of a small RNA molecule at the 5' end of the mRNA from an independent spliced-leader (SL) gene and has been described in numerous species <abbrgrp><abbr bid="B26">26</abbr></abbrgrp>. To exclude the possibility of an artifact, the 226 available EST sequences of <it>F. enflata</it>, another ch&#230;tognath species, were screened using the identified SL sequences from <it>S. cephaloptera</it>. This survey led to the recovery of similar SL sequences at the 5' end of several cDNA sequences. As <it>F. enflata </it>and <it>S. cephaloptera </it>belong to the two main orders of ch&#230;tognaths <abbrgrp><abbr bid="B10">10</abbr></abbrgrp>, the trans-splicing mechanism is likely to be present in the whole ch&#230;tognath phylum.</p>
            <fig id="F7">
               <title>
                  <p>Figure 7</p>
               </title>
               <caption>
                  <p>Identified <it>S. cephaloptera </it>operon within the BAC 35YA21</p>
               </caption>
               <text>
                  <p>Identified <it>S. cephaloptera </it>operon within the BAC 35YA21. <b>(a) </b>Structure of the 158 kb BAC 35A21, including the predicted genes and the mapping of ESTs that bear SLs (purple). Detailed EST/BAC alignments are provided as Additional data files 15-17. <b>(b) </b>Detailed structure of the identified ch&#230;tognath operon with RP S14 and PCNA genes and the corresponding ESTs (purple) that exhibit SL sequences. UTR (genomic, light orange; EST, light purple) and coding sequences (genomic, orange; EST, purple). <b>(c) </b>Alignments of selected regions of the operon, beginning and end of genes showing genomic DNA (orange) and transcripts with their alternative SL forms. The very short distance encountered between the end and beginning of the two genes argues for polycistronic transcription.</p>
               </text>
               <graphic file="gb-2008-9-6-r94-7"/>
            </fig>
            <p>An extensive study of trans-splicing in the nematode phylum has previously revealed the presence of different forms of SL sequences <abbrgrp><abbr bid="B58">58</abbr></abbrgrp>. Similarly, several different SL sequences were retrieved from <it>S. cephalotera </it>(Table <tblr tid="T3">3</tblr>). This number is consistent with the strong level of polymorphism previously observed for coding sequences but two distinct SL forms alone (SL1 and SL2) represent 87% of the SL sequences (Table <tblr tid="T3">3</tblr>). These forms do not exhibit any specificity for the different paralogs since SLs are added randomly to transcripts from these paralogs (Figure <figr fid="F7">7</figr>; Additional data files 5 and 6). In an attempt to understand the evolutionary history of trans-splicing within the ch&#230;tognath phylum, the SL forms of <it>F. enflata </it>were compared with those of <it>S. cephaloptera</it>. This set of ch&#230;tognath SL sequences splits into four main forms: two of them, SL1 and SL3, are present in both the species investigated whereas the two other forms, SL2 and SL4, are specific for <it>S. cephaloptera </it>and <it>F. enflata</it>, respectively (Table <tblr tid="T3">3</tblr>). Otherwise, neither of these ch&#230;tognath SL forms display similarity with the SL of another phyla. This finding suggests that just as in nematodes, the evolution of alternative forms could have occurred at a relatively reduced taxonomic scale <abbrgrp><abbr bid="B58">58</abbr></abbrgrp>.</p>
            <tbl id="T3">
               <title>
                  <p>Table 3</p>
               </title>
               <caption>
                  <p>Splice-leader isoforms isolated in two ch&#230;tognath species: <it>S. cephaloptera </it>and <it>F. enflata</it></p>
               </caption>
               <tblbdy cols="5">
                  <r>
                     <c ca="left">
                        <p>Form</p>
                     </c>
                     <c ca="left">
                        <p>ID</p>
                     </c>
                     <c ca="left">
                        <p>Sequence</p>
                     </c>
                     <c ca="left">
                        <p>Species</p>
                     </c>
                     <c ca="center">
                        <p>Abundance</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="5">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Form 1</b>
                        </p>
                     </c>
                     <c ca="left">
                        <p>
                           <b>SL1</b>
                        </p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCTAAAATTCTTTTA--TTTGCTT-AATTAAA</p>
                     </c>
                     <c ca="left">
                        <p>Both</p>
                     </c>
                     <c ca="center">
                        <p>&lt;</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Form 2</b>
                        </p>
                     </c>
                     <c ca="left">
                        <p>
                           <b>SL2.0</b>
                        </p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCTTATAATTGAGTAGTTTCAATTTGTTTAAA</p>
                     </c>
                     <c ca="left">
                        <p>Both</p>
                     </c>
                     <c ca="center">
                        <p>70.83%</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>SL2.1</p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCTTATAATTGAGTGGTTTCAATTTGTTTAAA</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>S. cephaloptera</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>&lt;</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>SL2.2</p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCTTATAATTGAGCAGTTTCAATTTGTTTAAA</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>S. cephaloptera</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>&lt;</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>SL2.3</p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCTTATAATTGACTATTTTCAATTTGTTTAAA</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>S. cephaloptera</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>&lt;</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>SL2.4</p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCTTATAATTGAGTATTTTCAATTTGTTTAAA</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>S. cephaloptera</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1.44%</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>SL2.5</p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCTTATAATTGCGTATTTTCAATTTGTTTAAA</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>S. cephaloptera</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>&lt;</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>SL2.6</p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCTTATAATTGCGTAGTTTCAATTTGTTTAAA</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>S. cephaloptera</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>&lt;</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>SL2.7</p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCTTATAATTCATTAGTTTCAATTTGTTTAAA</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>S. cephaloptera</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>&lt;</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>SL2.8</p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCTTATAATTCAGTAGTTTCAATTTGTTTAAA</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>S. cephaloptera</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>&lt;</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>SL2.9</p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCTTATAATTGATTAGTTTCAATTTGTTTAAA</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>S. cephaloptera</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2.17%</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>SL2.10</p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCTTATAACTGTTTAGTTTCAATTTGTTTAAA</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>S. cephaloptera</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>&lt;</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>SL2.11</p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCTTATAATTGACTAGTTTCAATTTGTTTAAA</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>S. cephaloptera</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>&lt;</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>SL2.12</p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCTTATAATTGAGTAGCTTCAATTTGTTTAAA</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>S. cephaloptera</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>&lt;</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Form 3</b>
                        </p>
                     </c>
                     <c ca="left">
                        <p>SL3.1</p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCCAAT-TTCTACTA-CTTCACTT-GTTTAAA</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>F. enflata</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>SL3.2</p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCTAAT-TTCTACTA-CTTCACTT-GTTTAAA</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>F. enflata</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>SL3.3</p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCTAAT-ATCTACTA-CTTCACTTTGTTTAAA</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>F. enflata</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Form 4</b>
                        </p>
                     </c>
                     <c ca="left">
                        <p>SL4.1</p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCTTATTATCAAGTACTACCAATTTGTTTAAA</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>S. cephaloptera</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>&lt;</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>SL4.2</p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCTTATTATTAAGTACTACCAATTTGTTTAAA</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>S. cephaloptera</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>16.91%</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>SL4.3</p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCTTATTATTAAGTACTACCAAATTGTTTAAA</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>S. cephaloptera</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>&lt;</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>SL4.4</p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCTTATTATTAAGTACTACCAGTTTGTTTAAA</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>S. cephaloptera</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>&lt;</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>SL4.5</p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCTTATTATTACGTACTACCAATTTGTTTAAA</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>S. cephaloptera</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>&lt;</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>SL4.6</p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCTTATTATTAATTACTACCAATTTGTTTAAA</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>S. cephaloptera</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>&lt;</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>SL4.7</p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCTTATTATTATTTACTACCAATTTGTTTAAA</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>S. cephaloptera</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>&lt;</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>SL4.8</p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCTTATTATTAACTACTACCAATTTGTTTAAA</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>S. cephaloptera</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>&lt;</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>SL4.9</p>
                     </c>
                     <c ca="left">
                        <p>GGAAGCTTATTATTCAGTACTACCAATTTGTTTAAA</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>S. cephaloptera</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>&lt;</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>The abundance of the forms corresponds to the rate of the forms among all SLs and is calculated only for <it>S. cephaloptera </it>sequences. A 'less-than' sign indicates that the abundance is below 1%.</p>
               </tblfn>
            </tbl>
            <p>Within the EST collection, 2,914 sequences exhibit SL addition, which represents 30% of nuclear transcripts (Figure <figr fid="F8">8a</figr>). Among the SL population, 72% are coding transcripts, of which 46% have a homolog in SwissProt. The clustering of similar coding trans-spliced transcripts indicated that 41% of putative genes undergo SL addition. Furthermore, the relationship between trans-splicing and expression level was tested through the comparison of the number of ESTs per cluster of trans-spliced or non-trans-spliced transcripts. If we posit that this number can be considered as an estimate of the expression level, trans-spliced genes are significantly more expressed than others (Wilcoxon rank test, <it>p </it>&lt; 2.2e<sup>-16</sup>). For instance, among the 50 more expressed genes (that is, biggest EST clusters), only two are not trans-spliced. These values suggest that trans-splicing is involved in the regulation of a set of strongly expressed genes responsible for key cellular functions, for example, the RP set.</p>
            <fig id="F8">
               <title>
                  <p>Figure 8</p>
               </title>
               <caption>
                  <p>Categories of trans-spliced transcripts for ch&#230;tognath <b>(a) </b><it>S. cephaloptera </it>and <b>(b) </b>nematode <it>C. elegans</it></p>
               </caption>
               <text>
                  <p>Categories of trans-spliced transcripts for ch&#230;tognath <b>(a) </b><it>S. cephaloptera </it>and <b>(b) </b>nematode <it>C. elegans</it>. The presence of a SL sequence is related to coding properties and homologous matches in SwissProt (score >150) of the sequences. <it>C. elegans </it>exhibits less non-coding transcripts than <it>S. cephaloptera</it>.</p>
               </text>
               <graphic file="gb-2008-9-6-r94-8"/>
            </fig>
            <p>Hence, the set of trans-spliced genes of <it>S. cephaloptera </it>was compared with those of other animals that carry out this RNA maturation process (Table <tblr tid="T4">4</tblr>). Particularly, trans-splicing was characterized in the nematode <it>C. elegans </it>model, for which a large EST set is available <abbrgrp><abbr bid="B58">58</abbr><abbr bid="B59">59</abbr></abbrgrp>. These data were especially useful for extensive comparisons with <it>S. cephaloptera </it>(Figure <figr fid="F8">8b</figr>). The amount of ESTs with a SL is slightly smaller in <it>C. elegans </it>(22%) than in <it>S. cephaloptera </it>(29%) and trans-spliced transcripts are missing from the very reduced non-coding ESTs, only 5% of the total EST collection in <it>C. elegans</it>. This comparison suggests that trans-splicing is at least as widespread in <it>S. cephaloptera </it>as in <it>C. elegans</it>. Furthermore, the set of genes affected by trans-splicing in <it>S. cephaloptera </it>was comparable with those of <it>C. elegans</it>. Among the 119 different genes that are both trans-spliced and annotated using SwissProt with high confidence, 79 have trans-spliced homologous genes in <it>C. elegans </it>(Additional data file 3). These values do not include the 78 RP set, which are conserved and trans-spliced in both species. While the molecular actors involved in trans-splicing do not exhibit evolutionary conservation <abbrgrp><abbr bid="B26">26</abbr></abbrgrp>, the genes undergoing this kind of processing could otherwise be similar in distantly related species.</p>
            <tbl id="T4">
               <title>
                  <p>Table 4</p>
               </title>
               <caption>
                  <p>Distribution and modalities of trans-splicing among metazoans</p>
               </caption>
               <tblbdy cols="7">
                  <r>
                     <c ca="left">
                        <p>Phylum: species</p>
                     </c>
                     <c ca="center">
                        <p>Trans-splicing</p>
                     </c>
                     <c ca="center">
                        <p>Percent trans-spliced genes</p>
                     </c>
                     <c ca="center">
                        <p>Number of SL forms</p>
                     </c>
                     <c ca="center">
                        <p>Operons</p>
                     </c>
                     <c ca="center">
                        <p>Percent genes in operons</p>
                     </c>
                     <c ca="center">
                        <p>References</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="7">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Cnidaria: <it>Hydra vulgaris</it></p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="center">
                        <p>Very few*</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>?</p>
                     </c>
                     <c ca="center">
                        <p>NA</p>
                     </c>
                     <c ca="center">
                        <p>[85]</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Urochordata (tunicate): <it>Ciona intestinalis</it></p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="center">
                        <p>~2%*</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="center">
                        <p>~2%</p>
                     </c>
                     <c ca="center">
                        <p>[61]</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Ch&#230;tognatha: <it>Spadella cephaloptera</it>; <it>Flaccisagitta enflata</it></p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="center">
                        <p>~55%</p>
                     </c>
                     <c ca="center">
                        <p>2*</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="center">
                        <p>ND</p>
                     </c>
                     <c ca="center">
                        <p>This study</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Acoela: <it>Convoluta pulchra</it></p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="center">
                        <p>>5%</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>?</p>
                     </c>
                     <c ca="center">
                        <p>ND</p>
                     </c>
                     <c ca="center">
                        <p>This study</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Rotifera: <it>Adineta ricciae</it>; <it>Philodina </it>sp.</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="center">
                        <p>ND</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>ND</p>
                     </c>
                     <c ca="center">
                        <p>ND</p>
                     </c>
                     <c ca="center">
                        <p>[37]</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Platyhelminth: <it>Schistosoma mansoni</it>; seven more species<sup>&#8225;</sup></p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="center">
                        <p>>3%<sup>&#8224;</sup></p>
                     </c>
                     <c ca="center">
                        <p>1-2</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="center">
                        <p>ND</p>
                     </c>
                     <c ca="center">
                        <p>[60,62]</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Nematoda: <it>Caenothabditis elegans</it></p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="center">
                        <p>~50%</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="center">
                        <p>~20%</p>
                     </c>
                     <c ca="center">
                        <p>[58,59]</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>*This figure was obtained by the analysis of a sample of several cDNA libraries sequenced from the 5' end. <sup>&#8224;</sup>This figure was obtained from 3' end sequenced cDNA libraries and may be greatly underestimated. <sup>&#8225;</sup>For a precise list of these species see [62]. NA, not applicable; ND, not determined.</p>
               </tblfn>
            </tbl>
            <p>Trans-splicing has been discovered in a set of organisms spread all over the phylogenetic tree of eukaryotes, but the molecular actors involved in this RNA maturation process do not exhibit any evolutionary conservation: the SL sequences cannot be aligned and the ribonucleoproteic machineries involved in this process have no homologs in other species <abbrgrp><abbr bid="B26">26</abbr><abbr bid="B37">37</abbr><abbr bid="B60">60</abbr><abbr bid="B61">61</abbr><abbr bid="B62">62</abbr></abbrgrp>. However, the discovery of SL trans-splicing in new animal phyla strongly argues for an ancient origin of this process, especially if these phyla have significant phylogenetic positions, such as ch&#230;tognaths or acoels. Noticeably, we also found evidence for SL addition in recently released ESTs from the acoels (unpublished observations), worm-like animals that were recently excluded from the protostomes <abbrgrp><abbr bid="B30">30</abbr></abbrgrp>. Moreover, an extensive comparison of available genomic data revealed that the set of genes undergoing trans-splicing is evolutionarily conserved between those species, which is another indication of a putative common evolutionary origin of trans-splicing (Additional data file 3 and Table <tblr tid="T4">4</tblr>).</p>
         </sec>
         <sec>
            <st>
               <p>Operonic transcription in <it>S. cephaloptera</it></p>
            </st>
            <p>In the nematode ch&#230;tognath <it>C. elegans </it>and the tunicate <it>Ciona intestinalis</it>, polycistronic mRNA molecules that contain two or more genes are transcribed from operon structures and subsequently resolved by trans-splicing <abbrgrp><abbr bid="B58">58</abbr><abbr bid="B59">59</abbr></abbrgrp>. We mined for similar eukaryotic operons in our pool of sequenced bacterial artificial chromosomes (BACs) in looking for clusters of genes with the same transcription orientation and very short intergenic regions. The trans-splicing maturation of these putative operons was confirmed by mapping the tran-spliced ESTs onto these genomic sequences. One operon including RP S14 and PCNA genes was successfully identified in the BAC 35A21 that otherwise contains a large number of genes undergoing trans-splicing (Figure <figr fid="F7">7a</figr>; Table S5 in Additional data file 2; Additional data files 15-17). EST mapping and <it>ab initio </it>gene prediction suggested that only three bases separate the polyadenylation site of the upstream RP S14 gene from the acceptor splice site at the PCNA downstream gene. This distance is even shorter than that in <it>C. intestinalis </it>operons <abbrgrp><abbr bid="B61">61</abbr></abbrgrp> and clearly excludes the possibility for a re-initiation of transcription between the genes (Figure <figr fid="F7">7c</figr>). This BAC sequence contains several other predicted genes that are closely clustered, share the same orientation and could thus belong to operonic structures (Figure <figr fid="F7">7</figr>; Table S5 in Additional data file 2). The transcripts of gene RP S14 include the two major SL 1 or 2 forms (Figure <figr fid="F7">7c</figr>). Similarly, transcripts from both paralogous copies of duplicated genes bear any of the alternative SL forms. Hence, contrary to <it>C. elegans </it>for which a SL form is specific for the upstream and the downstream genes in operons <abbrgrp><abbr bid="B58">58</abbr></abbrgrp>, no specificity of the SL for gene position in the operon was recovered in <it>S. cephaloptera </it>(Figure <figr fid="F7">7</figr>).</p>
            <p>Hence, we have provided arguments for polycistronic transcription in another animal phylum, the ch&#230;tognaths. Animal operons have previously been described in the nematodes and in the tunicate <it>C. intestinalis </it>and were often interpreted as an adaptation to the genome size reduction observed in both these organisms <abbrgrp><abbr bid="B26">26</abbr></abbrgrp>. However, the genome size of <it>S. cephaloptera </it>is rather large at 1.05 Gb <abbrgrp><abbr bid="B63">63</abbr></abbrgrp> and the transcriptome of ch&#230;tognaths is conserved among bilaterians, in terms of gene similarity and content. Furthermore, extensive study of genes co-transcribed in <it>C. elegans </it>led to the conclusion that the operons constitute functional units in grouping genes involved in similar pathways <abbrgrp><abbr bid="B59">59</abbr></abbrgrp>. Hence, the presence of operonic transcription in the ch&#230;tognath, a basal protostome, strongly suggests that this mechanism should be more likely considered as an original mode of gene regulation, whose evolutionary importance may have been underestimated. Thanks to the pivotal comparative genomic abilities of ch&#230;tognaths, the comparison of operon structure and content between nematodes and ch&#230;tognaths should allow the extension of the functional results obtained in <it>C. elegans </it>to a larger set of organisms, including vertebrates. Such an approach would require further genomic data in the ch&#230;tognath but will likely lead to the characterization of new gene regulatory networks, potentially leading to a better understanding of some genetic disorders <abbrgrp><abbr bid="B59">59</abbr></abbrgrp>.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Conclusion</p>
         </st>
         <p>Ch&#230;tognaths have been formerly known for their peculiar morphological characteristics. The fine-scale analysis of transcriptomic data reported here illuminates significant genomic features of this phylum, strengthening its very original status among bilaterians. These genome features may be shuffled into opposite categories: shared ancestral characteristics of bilaterians on one hand and lineage-specific rearrangements and divergences on the other. First, the ch&#230;tognath transcriptome bears a core set of genes conserved within bilaterians. Together with recent evidence from lophotrochozoans such as annelids <abbrgrp><abbr bid="B64">64</abbr></abbrgrp>, this result confirms that the extensive gene loss previously observed within insects or nematodes cannot be extended to the whole protostome lineage. The conservation of such a core gene set was exploited for phylogenomic inference through the definition of RP genes as high-grade marker genes for phylogeny. Subsequent analyses of these marker genes confirmed the basal position of ch&#230;tognaths among protostomes, a position that has been previously supported <abbrgrp><abbr bid="B18">18</abbr><abbr bid="B30">30</abbr><abbr bid="B43">43</abbr></abbrgrp>. This position strongly impacts on the understanding of the evolution of embryological characteristics since it rejects some developmental characteristics at the stem of bilaterians, such as enterocoely or secondary mouth opening that were considered to be deuterostome-specific.</p>
         <p>This interpretation can be extended to the new genome-level characteristics that we have highlighted here. For example, the trans-splicing mechanism of mRNA processing as well as the operonic transcription depicted here were often interpreted as a secondary evolved condition related to peculiar adaptations in animals such as nematodes or tunicates <abbrgrp><abbr bid="B26">26</abbr></abbrgrp>. Contrarily, the occurrence of these mechanisms in ch&#230;tognaths and acoels suggests that their evolutionary origins may be more ancient than originally expected. Together, these findings strongly argue for the relevance of ch&#230;tognaths as a comparative genomics model because of their conserved gene set, their original phylogenetic position and their original features such as trans-splicing and operonic transcription. For example, the study of ch&#230;tognath operons could be a promising approach to identify molecular pathways involved in human genetic diseases <abbrgrp><abbr bid="B59">59</abbr></abbrgrp>.</p>
         <p>Some genetic and genomic features of ch&#230;tognaths we have illustrated here are unique among the animals. We have discovered a genome duplication event followed by a high retention of duplicated genes that were maintained under strong purifying selection. The current view of the evolution of duplicated genes in animals or plants mainly predicts a loss of genes that have not evolved novel functions <abbrgrp><abbr bid="B50">50</abbr><abbr bid="B65">65</abbr></abbrgrp>. This view is contradicted by recent evidence from protists <abbrgrp><abbr bid="B47">47</abbr></abbrgrp>, plants <abbrgrp><abbr bid="B25">25</abbr></abbrgrp> and the whole fungal kingdom <abbrgrp><abbr bid="B66">66</abbr></abbrgrp> that suggests new modalities of genome evolution and, in particular, strong retention and constraint of former duplicated genes. Hence, the ch&#230;tognath genome duplication deserves further documentation and investigation as one possible special case among bilaterians. Another unique feature of ch&#230;tognaths is the high level of divergence within the population. We demonstrated that this divergence is related to neither cryptic speciation nor past hybridization but conversely revealed very high mutation rates within the germ line of individuals but also within their soma. These observations have deep implications for the correct interpretation of numerous population genetics studies. This apparent genome plasticity with duplications and high mutation rates is in contrast to the strong morphological conservation of the phylum that has continued nearly unchanged since the early Cambrian period <abbrgrp><abbr bid="B8">8</abbr><abbr bid="B9">9</abbr></abbrgrp>. This uncoupling between morphological conservation and genome plasticity makes us wonder how the gene regulatory networks responsible for the establishment of the body organization of these animals could have remained stable despite such a genome dynamic?</p>
         <p>In summary, these findings promote the study of ch&#230;tognath for orienting not only morphological but also genomic characteristics among bilaterians. With the recent rise of lophotrochozoans as promising model systems <abbrgrp><abbr bid="B67">67</abbr></abbrgrp>, the ch&#230;tognath phylum represents the next step of investigation within protostomes with its striking combination of distinct ancestral and derived features that could illuminate the evolution of bilaterians.</p>
      </sec>
      <sec>
         <st>
            <p>Materials and methods</p>
         </st>
         <sec>
            <st>
               <p>cDNA library and EST sequencing</p>
            </st>
            <p>The juvenile-staged cDNA library of <it>S. cephaloptera</it>, Bush 1851 was previously described in <abbrgrp><abbr bid="B18">18</abbr></abbrgrp>. Briefly, polyA+ RNAs were isolated from hatchling to one-day-old juveniles collected in the coastal area near Marseille (Le Brusc, La Ciotat). After reverse transcription and selection of longer transcripts by size fractionation, cDNAs were cloned into Lambda Triplex 2 vector (Clontech, Palo Alto, CA, USA). There were 12,324 clones sequenced from a 5' primer at G&#233;noscope (CNS, France). A total of 390 sequences were discarded due to vector contamination or cloning artifacts, yielding a total 11,934 sequences.</p>
         </sec>
         <sec>
            <st>
               <p>BAC library</p>
            </st>
            <p>The BAC library was constructed by BioS&amp;T Inc. (Montreal, Qu&#233;bec, Canada) in the pIndigoBAC-5 vector (Epicentre, Madison, WI, USA) from adult <it>S. cephalotera </it>genomic DNA. Average insert size is 135 kb. The library was arrayed and selected clones were sequenced using a shotgun approach at G&#233;noscope.</p>
         </sec>
         <sec>
            <st>
               <p>Analysis of the EST collection</p>
            </st>
            <p>The sequences were annotated through Blast searches <abbrgrp><abbr bid="B68">68</abbr></abbrgrp> against SwissProt and TrEMBL databases. The transcripts were searched for reliable coding sequences using ESTScan and subsequently sorted into coding and non-coding sequences <abbrgrp><abbr bid="B69">69</abbr></abbrgrp>. Transcripts from the same putative genes were grouped into clusters using CLOBB <abbrgrp><abbr bid="B70">70</abbr></abbrgrp>. The functional Gene Ontology classification was retrieved from SwissProt matches using Fatigo <abbrgrp><abbr bid="B71">71</abbr></abbrgrp>. Transcripts that bear splice-leader at their 5' extremity were searched with Blastn using the SL sequences obtained from a preliminary screen. Data parsing processes were conducted using Perl scripting language and the Bioperl resource <abbrgrp><abbr bid="B72">72</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Databases and searches for marker genes</p>
            </st>
            <p>The set of databases compared with the ch&#230;tognath transcriptome includes the transcriptomes of <it>D. melanogaster </it>and <it>H. sapiens </it>downloaded from Ensembl <abbrgrp><abbr bid="B73">73</abbr></abbrgrp>. The partial transcriptome of <it>Lumbricus rubellus </it>as well as clade-level EST databases were obtained from the NCBI EST database using appropriate keywords <abbrgrp><abbr bid="B74">74</abbr></abbrgrp>. The recently released genomes of several lophotrochozoans (<it>Capitella capitata, Helobdella robusta, Lottia gigantea, Aplysia californica</it>, <it>Schmidtea mediterranea </it>and <it>Schistosoma mansoni</it>) were accessed directly on the JGI web site <abbrgrp><abbr bid="B75">75</abbr></abbrgrp> or retrieved from the NCBI trace archive <abbrgrp><abbr bid="B76">76</abbr></abbrgrp>. The respective scores were visualized using Simitri <abbrgrp><abbr bid="B77">77</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Duplicated gene detection</p>
            </st>
            <p>All the transcript sequences encoding similar protein coding sequences were clustered on the basis of a similar SwissProt hit or a reciprocal blast hit after conceptual translation by ESTScan <abbrgrp><abbr bid="B69">69</abbr></abbrgrp>. Gene clusters were analyzed using Clustalw alignment, phylogenetic analyses and visual checking for the inclusion of potential diverging sequences (Table S1 in Additional data file 2). The minimal EST number (N) per cluster to detect the occurrence of two duplicated paralogous sequences at a 5% probability is 6 as estimated by 1 - 2(1/2)<sup>N</sup>. Ka/Ks were computed using PAML <abbrgrp><abbr bid="B78">78</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Phylogenetic analyses</p>
            </st>
            <p>The RP dataset was built using a composite database approach so as to select the least divergent sequences for each taxon <abbrgrp><abbr bid="B18">18</abbr></abbrgrp>. The species set involved in each taxon as well as the data on missing sequences are available in Table S1 in Additional data file 2. This dataset was analyzed using the CAT model as implemented in Phylobayes <abbrgrp><abbr bid="B79">79</abbr></abbrgrp>. Maximum-likelihood and Bayesian inferences were performed using PhyML <abbrgrp><abbr bid="B80">80</abbr></abbrgrp>, Treefinder <abbrgrp><abbr bid="B81">81</abbr></abbrgrp> and MrBayes <abbrgrp><abbr bid="B82">82</abbr></abbrgrp>, respectively, and both assumed a WAG+&#915;4+I model. For bayesian analyses (MrBayes and Phylobayes), at least two chains were launched, their convergence was verified and the corresponding burn-in period discarded.</p>
         </sec>
         <sec>
            <st>
               <p>PCR amplifications of duplicated markers</p>
            </st>
            <p>The individuals of <it>S. cephaloptera </it>employed for polymorphism analysis were collected across the <it>Posidonia </it>seagrass, in the calanque of Sormiou, in the coastal area near Marseille, France. Copies of nuclear RP S36 and RP L40 and mitochondrial Cytb genes were amplified by PCR using allele-specific primers (Table S3 in Additional data file 2). Genomic DNA extractions were carried out on heads and bodies of <it>S. cephaloptera </it>individuals from the calanque of Sormiou using the Wizard SV Kit (Promega, Madison, WI, USA) and PCR reactions were carried out using GoTaq polymerase (Promega). PCR conditions were defined according to the melting temperature determined for each pair of primers. Fragments were subsequently gel-purified, cloned in pGEM-T easy (Promega) and sequenced. PCR artifacts were excluded by two approaches: first, amplifications were performed on head and body of the same individual, which allows checking of the congruence between the sequences; then, the accuracy of DNA polymerase was verified by amplifying and sequencing cloned DNA. These validations were confirmed by the recovery of the amplified sequences in the EST library and by the high levels of substitutions between sequences, which are too large to be interpreted as PCR artifacts.</p>
         </sec>
         <sec>
            <st>
               <p>Population genetic analyses</p>
            </st>
            <p>Pairwise sequence comparisons and molecular evolution analyses were performed with Mega2 software assuming the kimura 2 parameters model <abbrgrp><abbr bid="B83">83</abbr></abbrgrp>. The demographic history of the populations was evaluated by mismatch analyses using Tajima's D and Fu and Li's D neutrality test implemented in DNAsp software <abbrgrp><abbr bid="B84">84</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Accession numbers</p>
            </st>
            <p>The set of sequences analyzed in this paper has been deposited in GenBank with the following accession numbers: <ext-link ext-link-type="gen" ext-link-id="CU555081">CU555081</ext-link>-<ext-link ext-link-type="gen" ext-link-id="CU563075">CU563075</ext-link> and <ext-link ext-link-type="gen" ext-link-id="CU693608">CU693608</ext-link>-<ext-link ext-link-type="gen" ext-link-id="CU693592">CU693592</ext-link> for the 11,934 ESTs, <ext-link ext-link-type="gen" ext-link-id="CU672232">CU672232</ext-link> for the BAC 35YA21, and <ext-link ext-link-type="gen" ext-link-id="EU529890">EU529890</ext-link>-<ext-link ext-link-type="gen" ext-link-id="EU529968">EU529968</ext-link> for the sequences of RP L36 and L40 paralogs in nine individuals (Table <tblr tid="T2">2</tblr>).</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Abbreviations</p>
         </st>
         <p>BAC, bacterial artificial chromosome; BP, bootstrap proportion; Cytb, cytochrome b; EST, expressed sequence tag; GAMT, guanidinoacetate N-methyltransferase; indels, insertion or deletion events; LSU, large subunit of ribosomal RNA; PP, posterior probability; RP, ribosomal protein; 
SL, splice-leader; SSU, small subunit of ribosomal RNA; UTR, untranslated region; WGD, whole genome duplication.</p>
      </sec>
      <sec>
         <st>
            <p>Authors' contributions</p>
         </st>
         <p>YLP and FM conceived the project and performed the analyses focused on phylogenomics, characterization of duplication and trans-splicing. YLP and XC were in charge of the construction of the cDNA and BAC libraries. YLP, FM, and AG carried out the experiments related to the study of polymorphism in the population. YP ensured the collection of animals required for construction of libraries and population genetics studies. PW supervised the sequencing project that SS, CD and GG carried out. FM wrote the paper and all authors agreed on the final version.</p>
      </sec>
      <sec>
         <st>
            <p>Additional data files</p>
         </st>
         <p>The following additional data are available. Additional data file <supplr sid="S1">1</supplr> includes supplementary Figures S1-S6 with legends: EST library statistics (Figure S1), Gene Ontology annotation (Figure S2), alignment of GAMT in selected taxa (Figure S3), trees illustrating the divergence between copies of nuclear and mitochondrial genes in the library (Figure S4), transition versus transversion ratios for the five targeted genes (Figure S5), and mismatch analyses and testing for the five targeted genes (Figure S6). Additional data file <supplr sid="S2">2</supplr> includes supplementary Tables S1-S5 with legends: composition of the composite taxa involved in phylogenomic analyses (Table S1), list of all clusters of transcripts corresponding to alternative forms or not with Ka/Ks ratios (Table S2), list of primers employed for PCR amplifications of alternative forms (Table S3), comparison of molecular evolution trends for four genes retrieved in nine individuals (Table S4), and annotation of the BAC 35A21 (Table S5). Additional data file <supplr sid="S3">3</supplr> lists the trans-spliced genes conserved between <it>S. cephaloptera </it>and <it>C. elegans </it>andhomologous to a SwissProt entry (Figure S6 in Additional data file <supplr sid="S1">1</supplr>). Additional data file <supplr sid="S4">4</supplr> is the concatenated gblocked alignment that clusters 77 RPs, yielding 24 taxa and 11,730 shuffled amino acid positions. This dataset was employed for phylogenomic reconstruction. Additional data files <supplr sid="S5">5</supplr> and <supplr sid="S6">6</supplr> are the transcript sequences of RP L36 (Additional data file <supplr sid="S5">5</supplr>) and RP L40 (Additional data file <supplr sid="S6">6</supplr>) exhibiting the alternative forms corresponding to paralogous copies and the position of primers designed to specifically amplify these forms. Additional data file <supplr sid="S7">7</supplr> is the alignment of amino acid sequences of RUX paralogs and variants from <it>S. cephaloptera </it>and some other eukaryotic taxa. Additional data file <supplr sid="S8">8</supplr> is the alignment of Cytb displaying selected variants retrieved from the EST library and the coding sequences of Cytb from nine individuals showing the differences between genetic lineages within the population (primers employed for the specific amplifications are included). Additional data files <supplr sid="S9">9</supplr> and <supplr sid="S10">10</supplr> are the alignments of cytochrome oxydase I and III transcripts retrieved from the EST library. Additional data files <supplr sid="S11">11</supplr>, <supplr sid="S12">12</supplr>, <supplr sid="S13">13</supplr> and <supplr sid="S14">14</supplr> are the alignments of genomic sequence of paralogs of RP L36 (paralogs 1 and 2, Additional data files <supplr sid="S11">11</supplr> and <supplr sid="S12">12</supplr>) and RP L40 (paralogs 1 and 2, Additional data files <supplr sid="S13">13</supplr> and <supplr sid="S14">14</supplr>) from 9 individuals that have been amplified from the body (B) or head (H) of individuals as indicated in the sequence name. Additional data files <supplr sid="S15">15</supplr>, <supplr sid="S16">16</supplr> and <supplr sid="S17">17</supplr> are EST/BAC alignments for four trans-spliced genes present in BAC 35A21, whose transcripts are represented in the EST library. Additional data file <supplr sid="S15">15</supplr> contains the RP S14 and PCNA genes gathered in an operonic structure and eight matching ESTs. Additional data file <supplr sid="S16">16</supplr> contains the COP9 gene and two matching ESTs. Additional data file <supplr sid="S17">17</supplr> contains an unidentified gene matching EST clones 6YJ23. All these alignments clearly exhibit lack of a SL motif in the genomic sequence.</p>
         <suppl id="S1">
            <title>
               <p>Additional data file 1</p>
            </title>
            <caption>
               <p>Supplementary Figures S1-S6</p>
            </caption>
            <text>
               <p>Figure S1: EST library statistics. Figure S2: Gene Ontology annotation. Figure S3: alignment of GAMT in selected taxa. Figure S4: trees illustrating the divergence between copies of nuclear and mitochondrial genes in the library. Figure S5: transition versus transversion ratios for the five targeted genes. Figure S6: mismatch analyses and testing for the five targeted genes.</p>
            </text>
            <file name="gb-2008-9-6-r94-S1.pdf">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S2">
            <title>
               <p>Additional data file 2</p>
            </title>
            <caption>
               <p>Supplementary Tables S1-S5</p>
            </caption>
            <text>
               <p>Table S1: composition of the composite taxa involved in phylogenomic analyses. Table S2: list of all clusters of transcripts corresponding to alternative forms or not with Ka/Ks ratios. Table S3: list of primers employed for PCR amplifications of alternative forms. Table S4: comparison of molecular evolution trends for four genes retrieved in nine individuals. Table S5: annotation of the BAC 35A21.</p>
            </text>
            <file name="gb-2008-9-6-r94-S2.pdf">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S3">
            <title>
               <p>Additional data file 3</p>
            </title>
            <caption>
               <p>Trans-spliced genes conserved between <it>S. cephaloptera </it>and <it>C. elegans </it>and homologous to a SwissProt entry</p>
            </caption>
            <text>
               <p>Trans-spliced genes conserved between <it>S. cephaloptera </it>and <it>C. elegans </it>and homologous to a SwissProt entry (Figure S6 in Additional data file <supplr sid="S1">1</supplr>).</p>
            </text>
            <file name="gb-2008-9-6-r94-S3.xls">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S4">
            <title>
               <p>Additional data file 4</p>
            </title>
            <caption>
               <p>Concatenated gblocked alignment that clusters 77 RPs, yielding 24 taxa and 11,730 shuffled amino acid positions</p>
            </caption>
            <text>
               <p>This dataset was employed for phylogenomic reconstruction.</p>
            </text>
            <file name="gb-2008-9-6-r94-S4.fast">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S5">
            <title>
               <p>Additional data file 5</p>
            </title>
            <caption>
               <p>Transcript sequences of RP L36 exhibiting the alternative forms corresponding to paralogous copies and the position of primers designed to specifically amplify these forms</p>
            </caption>
            <text>
               <p>Transcript sequences of RP L36 exhibiting the alternative forms corresponding to paralogous copies and the position of primers designed to specifically amplify these forms.</p>
            </text>
            <file name="gb-2008-9-6-r94-S5.fast">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S6">
            <title>
               <p>Additional data file 6</p>
            </title>
            <caption>
               <p>Transcript sequences of RP L40 exhibiting the alternative forms corresponding to paralogous copies and the position of primers designed to specifically amplify these forms</p>
            </caption>
            <text>
               <p>Transcript sequences of RP L40 exhibiting the alternative forms corresponding to paralogous copies and the position of primers designed to specifically amplify these forms.</p>
            </text>
            <file name="gb-2008-9-6-r94-S6.fast">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S7">
            <title>
               <p>Additional data file 7</p>
            </title>
            <caption>
               <p>Alignment of amino acid sequences of RUX paralogs and variants from <it>S. cephaloptera </it>and some other eukaryotic taxa</p>
            </caption>
            <text>
               <p>Alignment of amino acid sequences of RUX paralogs and variants from <it>S. cephaloptera </it>and some other eukaryotic taxa.</p>
            </text>
            <file name="gb-2008-9-6-r94-S7.fast">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S8">
            <title>
               <p>Additional data file 8</p>
            </title>
            <caption>
               <p>Alignment of Cytb displaying selected variants retrieved from the EST library and the coding sequences of Cytb from nine individuals showing the differences between genetic lineages within the population</p>
            </caption>
            <text>
               <p>Primers employed for the specific amplifications are included.</p>
            </text>
            <file name="gb-2008-9-6-r94-S8.fast">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S9">
            <title>
               <p>Additional data file 9</p>
            </title>
            <caption>
               <p>Alignment of cytochrome oxydase I transcripts retrieved from the EST library</p>
            </caption>
            <text>
               <p>Alignment of cytochrome oxydase I transcripts retrieved from the EST library.</p>
            </text>
            <file name="gb-2008-9-6-r94-S9.fast">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S10">
            <title>
               <p>Additional data file 10</p>
            </title>
            <caption>
               <p>Alignment of cytochrome oxydase III transcripts retrieved from the EST library</p>
            </caption>
            <text>
               <p>Alignment of cytochrome oxydase III transcripts retrieved from the EST library.</p>
            </text>
            <file name="gb-2008-9-6-r94-S10.fast">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S11">
            <title>
               <p>Additional data file 11</p>
            </title>
            <caption>
               <p>Alignments of genomic sequences of paralogs of RP L36 (paralog 1) from nine individuals</p>
            </caption>
            <text>
               <p>Sequences were amplified from the body (B) or head (H) of individuals as indicated in the sequence name.</p>
            </text>
            <file name="gb-2008-9-6-r94-S11.fast">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S12">
            <title>
               <p>Additional data file 12</p>
            </title>
            <caption>
               <p>Alignments of genomic sequences of paralogs of RP L36 (paralog 2) from nine individuals</p>
            </caption>
            <text>
               <p>Sequences were amplified from the body (B) or head (H) of individuals as indicated in the sequence name.</p>
            </text>
            <file name="gb-2008-9-6-r94-S12.fast">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S13">
            <title>
               <p>Additional data file 13</p>
            </title>
            <caption>
               <p>Alignments of genomic sequences of paralogs of RP L40 (paralog 1) from nine individuals</p>
            </caption>
            <text>
               <p>Sequences were amplified from the body (B) or head (H) of individuals as indicated in the sequence name.</p>
            </text>
            <file name="gb-2008-9-6-r94-S13.fast">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S14">
            <title>
               <p>Additional data file 14</p>
            </title>
            <caption>
               <p>Alignments of genomic sequences of paralogs of RP L40 (paralog 2) from nine individuals</p>
            </caption>
            <text>
               <p>Sequences were amplified from the body (B) or head (H) of individuals as indicated in the sequence name.</p>
            </text>
            <file name="gb-2008-9-6-r94-S14.fast">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S15">
            <title>
               <p>Additional data file 15</p>
            </title>
            <caption>
               <p>EST/BAC alignment trans-spliced genes present in BAC 35A21: RP S14 and PCNA genes gathered in an operonic structure and eight matching ESTs</p>
            </caption>
            <text>
               <p>All the alignments in Additional data files <supplr sid="S15">15</supplr>, <supplr sid="S16">16</supplr>, <supplr sid="S17">17</supplr> clearly exhibit lack of a SL motif in the genomic sequence.</p>
            </text>
            <file name="gb-2008-9-6-r94-S15.fast">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S16">
            <title>
               <p>Additional data file 16</p>
            </title>
            <caption>
               <p>EST/BAC alignment trans-spliced genes present in BAC 35A21: the COP9 gene and two matching ESTs</p>
            </caption>
            <text>
               <p>All the alignments in Additional data files <supplr sid="S15">15</supplr>, <supplr sid="S16">16</supplr>, <supplr sid="S17">17</supplr> clearly exhibit lack of a SL motif in the genomic sequence.</p>
            </text>
            <file name="gb-2008-9-6-r94-S16.fast">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S17">
            <title>
               <p>Additional data file 17</p>
            </title>
            <caption>
               <p>EST/BAC alignment trans-spliced genes present in BAC 35A21: an unidentified gene matching EST clones 6YJ23</p>
            </caption>
            <text>
               <p>All the alignments in Additional data files <supplr sid="S15">15</supplr>, <supplr sid="S16">16</supplr>, <supplr sid="S17">17</supplr> clearly exhibit lack of a SL motif in the genomic sequence.</p>
            </text>
            <file name="gb-2008-9-6-r94-S17.fast">
               <p>Click here for file</p>
            </file>
         </suppl>
      </sec>
   </bdy>
   <bm>
      <ack>
         <sec>
            <st>
               <p>Acknowledgements</p>
            </st>
            <p>We thank Bastien Boussau and C&#233;dric Finet for their insightful comments on the manuscript. We also thank Eliane Alivon for her help in the molecular biology experiments, Susan Cure and Andy Saurin for correcting the manuscript. This work was supported by the GIS G&#233;nomique Marine (CNRS), the Consortium National de Recherche en G&#233;nomique, BQR from Universit&#233; de Provence and Universit&#233; de la M&#233;diterran&#233;e. FM is supported by a BDI CNRS Fellowship.</p>
         </sec>
      </ack>
      <refgrp>
         <bibl id="B1">
            <title>
               <p>Sea anemone genome reveals ancestral eumetazoan gene repertoire and genomic organization.</p>
            </title>
            <aug>
               <au>
                  <snm>Putnam</snm>
                  <fnm>NH</fnm>
               </au>
               <au>
                  <snm>Srivastava</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Hellsten</snm>
                  <fnm>U</fnm>
               </au>
               <au>
                  <snm>Dirks</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Chapman</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Salamov</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Terry</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Shapiro</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Lindquist</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Kapitonov</snm>
                  <fnm>VV</fnm>
               </au>
               <au>
                  <snm>Jurka</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Genikhovich</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Grigoriev</snm>
                  <fnm>IV</fnm>
               </au>
               <au>
                  <snm>Lucas</snm>
                  <fnm>SM</fnm>
               </au>
               <au>
                  <snm>Steele</snm>
                  <fnm>RE</fnm>
               </au>
               <au>
                  <snm>Finnerty</snm>
                  <fnm>JR</fnm>
               </au>
               <au>
                  <snm>Technau</snm>
                  <fnm>U</fnm>
               </au>
               <au>
                  <snm>Martindale</snm>
                  <fnm>MQ</fnm>
               </au>
               <au>
                  <snm>Rokhsar</snm>
                  <fnm>DS</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2007</pubdate>
            <volume>317</volume>
            <fpage>86</fpage>
            <lpage>94</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.1139158</pubid>
                  <pubid idtype="pmpid" link="fulltext">17615350</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B2">
            <title>
               <p>The rise and fall of Hox gene clusters.</p>
            </title>
            <aug>
               <au>
                  <snm>Duboule</snm>
                  <fnm>D</fnm>
               </au>
            </aug>
            <source>Development</source>
            <pubdate>2007</pubdate>
            <volume>134</volume>
            <fpage>2549</fpage>
            <lpage>2560</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1242/dev.001065</pubid>
                  <pubid idtype="pmpid" link="fulltext">17553908</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B3">
            <title>
               <p>Hox cluster disintegration with persistent anteroposterior order of expression in <it>Oikopleura dioica</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Seo</snm>
                  <fnm>HC</fnm>
               </au>
               <au>
                  <snm>Edvardsen</snm>
                  <fnm>RB</fnm>
               </au>
               <au>
                  <snm>Maeland</snm>
                  <fnm>AD</fnm>
               </au>
               <au>
                  <snm>Bjordal</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Jensen</snm>
                  <fnm>MF</fnm>
               </au>
               <au>
                  <snm>Hansen</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Flaat</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Weissenbach</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Lehrach</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Wincker</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Reinhardt</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Chourrout</snm>
                  <fnm>D</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2004</pubdate>
            <volume>431</volume>
            <fpage>67</fpage>
            <lpage>71</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature02709</pubid>
                  <pubid idtype="pmpid" link="fulltext">15343333</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B4">
            <title>
               <p>Phylogeny: the continuing classificatory conundrum of chaetognaths.</p>
            </title>
            <aug>
               <au>
                  <snm>Ball</snm>
                  <fnm>EE</fnm>
               </au>
               <au>
                  <snm>Miller</snm>
                  <fnm>DJ</fnm>
               </au>
            </aug>
            <source>Curr Biol</source>
            <pubdate>2006</pubdate>
            <volume>16</volume>
            <fpage>R593</fpage>
            <lpage>R596</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.cub.2006.07.006</pubid>
                  <pubid idtype="pmpid" link="fulltext">16890517</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B5">
            <aug>
               <au>
                  <snm>Hyman</snm>
                  <fnm>LH</fnm>
               </au>
            </aug>
            <source>The Invertebrates, Vol. 5, Smaller Coelomate Groups</source>
            <publisher>New York: McGraw-Hill</publisher>
            <pubdate>1959</pubdate>
         </bibl>
         <bibl id="B6">
            <title>
               <p>A new look at the ventral nerve centre of Sagitta: implications for the phylogenetic position of Chaetognatha (arrow worms) and the evolution of the bilaterian nervous system.</p>
            </title>
            <aug>
               <au>
                  <snm>Harzsch</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Muller</snm>
                  <fnm>CH</fnm>
               </au>
            </aug>
            <source>Front Zool</source>
            <pubdate>2007</pubdate>
            <volume>4</volume>
            <fpage>14</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1885248</pubid>
                  <pubid idtype="pmpid" link="fulltext">17511857</pubid>
                  <pubid idtype="doi">10.1186/1742-9994-4-14</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B7">
            <title>
               <p>The unique embryology of Chaetognatha.</p>
            </title>
            <aug>
               <au>
                  <snm>Kapp</snm>
                  <fnm>H</fnm>
               </au>
            </aug>
            <source>Zool Anz</source>
            <pubdate>2000</pubdate>
            <volume>239</volume>
            <fpage>263</fpage>
            <lpage>266</lpage>
         </bibl>
         <bibl id="B8">
            <title>
               <p>A possible Lower Cambrian chaetognath (arrow worm).</p>
            </title>
            <aug>
               <au>
                  <snm>Chen</snm>
                  <fnm>JY</fnm>
               </au>
               <au>
                  <snm>Huang</snm>
                  <fnm>DY</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2002</pubdate>
            <volume>298</volume>
            <fpage>187</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.1075059</pubid>
                  <pubid idtype="pmpid" link="fulltext">12364798</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B9">
            <title>
               <p>Early Cambrian origin of modern food webs: evidence from predator arrow worms.</p>
            </title>
            <aug>
               <au>
                  <snm>Vannier</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Steiner</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Renvois&#233;</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Hu</snm>
                  <fnm>SX</fnm>
               </au>
               <au>
                  <snm>Casanova</snm>
                  <fnm>JP</fnm>
               </au>
            </aug>
            <source>Proc Biol Sci</source>
            <pubdate>2007</pubdate>
            <volume>274</volume>
            <fpage>627</fpage>
            <lpage>633</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2197202</pubid>
                  <pubid idtype="pmpid" link="fulltext">17254986</pubid>
                  <pubid idtype="doi">10.1098/rspb.2006.3761</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B10">
            <title>
               <p>Systematics of Chaetognatha under the light of molecular data, using duplicated ribosomal 18S DNA sequences.</p>
            </title>
            <aug>
               <au>
                  <snm>Papillon</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Perez</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Caubit</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Le Parco</snm>
                  <fnm>Y</fnm>
               </au>
            </aug>
            <source>Mol Phylogenet Evol</source>
            <pubdate>2006</pubdate>
            <volume>38</volume>
            <fpage>621</fpage>
            <lpage>634</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.ympev.2005.12.004</pubid>
                  <pubid idtype="pmpid" link="fulltext">16434216</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B11">
            <title>
               <p>The phylogenetic affinities of the chaetognaths: a molecular analysis.</p>
            </title>
            <aug>
               <au>
                  <snm>Telford</snm>
                  <fnm>MJ</fnm>
               </au>
               <au>
                  <snm>Holland</snm>
                  <fnm>PW</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>1993</pubdate>
            <volume>10</volume>
            <fpage>660</fpage>
            <lpage>676</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">8336548</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B12">
            <title>
               <p>Evolution of 28S ribosomal DNA in chaetognaths: duplicate genes and molecular phylogeny.</p>
            </title>
            <aug>
               <au>
                  <snm>Telford</snm>
                  <fnm>MJ</fnm>
               </au>
               <au>
                  <snm>Holland</snm>
                  <fnm>PW</fnm>
               </au>
            </aug>
            <source>J Mol Evol</source>
            <pubdate>1997</pubdate>
            <volume>44</volume>
            <fpage>135</fpage>
            <lpage>144</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1007/PL00006130</pubid>
                  <pubid idtype="pmpid" link="fulltext">9069174</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B13">
            <title>
               <p>The mitochondrial genome of <it>Paraspadella gotoi </it>is highly reduced and reveals that chaetognaths are a sister group to protostomes.</p>
            </title>
            <aug>
               <au>
                  <snm>Helfenbein</snm>
                  <fnm>KG</fnm>
               </au>
               <au>
                  <snm>Fourcade</snm>
                  <fnm>HM</fnm>
               </au>
               <au>
                  <snm>Vanjani</snm>
                  <fnm>RG</fnm>
               </au>
               <au>
                  <snm>Boore</snm>
                  <fnm>JL</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2004</pubdate>
            <volume>101</volume>
            <fpage>10639</fpage>
            <lpage>10643</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">489987</pubid>
                  <pubid idtype="pmpid" link="fulltext">15249679</pubid>
                  <pubid idtype="doi">10.1073/pnas.0400941101</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B14">
            <title>
               <p>Identification of chaetognaths as protostomes is supported by the analysis of their mitochondrial genome.</p>
            </title>
            <aug>
               <au>
                  <snm>Papillon</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Perez</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Caubit</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Le Parco</snm>
                  <fnm>Y</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2004</pubdate>
            <volume>21</volume>
            <fpage>2122</fpage>
            <lpage>2129</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/molbev/msh229</pubid>
                  <pubid idtype="pmpid" link="fulltext">15306659</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B15">
            <title>
               <p>Hox gene survey in the chaetognath <it>Spadella cephaloptera</it>: evolutionary implications.</p>
            </title>
            <aug>
               <au>
                  <snm>Papillon</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Perez</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Fasano</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Le Parco</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Caubit</snm>
                  <fnm>X</fnm>
               </au>
            </aug>
            <source>Dev Genes Evol</source>
            <pubdate>2003</pubdate>
            <volume>213</volume>
            <fpage>142</fpage>
            <lpage>148</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">12690453</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B16">
            <title>
               <p>The <it>Hox</it> gene complement of a pelagic chaetognath, <it>Flaccisagitta enflata</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Matus</snm>
                  <fnm>DQ</fnm>
               </au>
               <au>
                  <snm>Halanych</snm>
                  <fnm>KM</fnm>
               </au>
               <au>
                  <snm>Martindale</snm>
                  <fnm>MQ</fnm>
               </au>
            </aug>
            <source>Integr Comp Biol</source>
            <pubdate>2007</pubdate>
            <volume>47</volume>
            <fpage>854</fpage>
            <lpage>864</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/icb/icm077</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B17">
            <title>
               <p>Phylogenomics and the reconstruction of the tree of life.</p>
            </title>
            <aug>
               <au>
                  <snm>Delsuc</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Brinkmann</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Philippe</snm>
                  <fnm>H</fnm>
               </au>
            </aug>
            <source>Nat Rev Genet</source>
            <pubdate>2005</pubdate>
            <volume>6</volume>
            <fpage>361</fpage>
            <lpage>375</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nrg1603</pubid>
                  <pubid idtype="pmpid" link="fulltext">15861208</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B18">
            <title>
               <p>Chaetognath phylogenomics: a protostome with deuterostome-like development.</p>
            </title>
            <aug>
               <au>
                  <snm>Marl&#233;taz</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Martin</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Perez</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Papillon</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Caubit</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Lowe</snm>
                  <fnm>CJ</fnm>
               </au>
               <au>
                  <snm>Freeman</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Fasano</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Dossat</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Wincker</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Weissenbach</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Le Parco</snm>
                  <fnm>Y</fnm>
               </au>
            </aug>
            <source>Curr Biol</source>
            <pubdate>2006</pubdate>
            <volume>16</volume>
            <fpage>R577</fpage>
            <lpage>R578</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.cub.2006.07.016</pubid>
                  <pubid idtype="pmpid" link="fulltext">16890510</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B19">
            <title>
               <p>Broad taxon and gene sampling indicate that chaetognaths are protostomes.</p>
            </title>
            <aug>
               <au>
                  <snm>Matus</snm>
                  <fnm>DQ</fnm>
               </au>
               <au>
                  <snm>Copley</snm>
                  <fnm>RR</fnm>
               </au>
               <au>
                  <snm>Dunn</snm>
                  <fnm>CW</fnm>
               </au>
               <au>
                  <snm>Hejnol</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Eccleston</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Halanych</snm>
                  <fnm>KM</fnm>
               </au>
               <au>
                  <snm>Martindale</snm>
                  <fnm>MQ</fnm>
               </au>
               <au>
                  <snm>Telford</snm>
                  <fnm>MJ</fnm>
               </au>
            </aug>
            <source>Curr Biol</source>
            <pubdate>2006</pubdate>
            <volume>16</volume>
            <fpage>R575</fpage>
            <lpage>R576</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.cub.2006.07.017</pubid>
                  <pubid idtype="pmpid" link="fulltext">16890509</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B20">
            <title>
               <p>Multigene analyses of bilaterian animals corroborate the monophyly of Ecdysozoa, Lophotrochozoa, and Protostomia.</p>
            </title>
            <aug>
               <au>
                  <snm>Philippe</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Lartillot</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Brinkmann</snm>
                  <fnm>H</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2005</pubdate>
            <volume>22</volume>
            <fpage>1246</fpage>
            <lpage>1253</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/molbev/msi111</pubid>
                  <pubid idtype="pmpid" link="fulltext">15703236</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B21">
            <title>
               <p>EST analysis of the cnidarian <it>Acropora millepora </it>reveals extensive gene loss and rapid sequence divergence in the model invertebrates.</p>
            </title>
            <aug>
               <au>
                  <snm>Kortschak</snm>
                  <fnm>RD</fnm>
               </au>
               <au>
                  <snm>Samuel</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Saint</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Miller</snm>
                  <fnm>DJ</fnm>
               </au>
            </aug>
            <source>Curr Biol</source>
            <pubdate>2003</pubdate>
            <volume>13</volume>
            <fpage>2190</fpage>
            <lpage>2195</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.cub.2003.11.030</pubid>
                  <pubid idtype="pmpid" link="fulltext">14680636</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B22">
            <title>
               <p>Large-scale sequencing and the new animal phylogeny.</p>
            </title>
            <aug>
               <au>
                  <snm>Philippe</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Telford</snm>
                  <fnm>MJ</fnm>
               </au>
            </aug>
            <source>Trends Ecol Evol</source>
            <pubdate>2006</pubdate>
            <volume>21</volume>
            <fpage>614</fpage>
            <lpage>620</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.tree.2006.08.004</pubid>
                  <pubid idtype="pmpid" link="fulltext">16919363</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B23">
            <title>
               <p>Rare genomic changes as a tool for phylogenetics.</p>
            </title>
            <aug>
               <au>
                  <snm>Rokas</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Holland</snm>
                  <fnm>PW</fnm>
               </au>
            </aug>
            <source>Trends Ecol Evol</source>
            <pubdate>2000</pubdate>
            <volume>15</volume>
            <fpage>454</fpage>
            <lpage>459</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0169-5347(00)01967-4</pubid>
                  <pubid idtype="pmpid" link="fulltext">11050348</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B24">
            <title>
               <p>Structure and function of the eukaryotic ribosome: the next frontier.</p>
            </title>
            <aug>
               <au>
                  <snm>Doudna</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Rath</snm>
                  <fnm>VL</fnm>
               </au>
            </aug>
            <source>Cell</source>
            <pubdate>2002</pubdate>
            <volume>109</volume>
            <fpage>153</fpage>
            <lpage>156</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0092-8674(02)00725-0</pubid>
                  <pubid idtype="pmpid" link="fulltext">12007402</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B25">
            <title>
               <p>Modeling gene and genome duplications in eukaryotes.</p>
            </title>
            <aug>
               <au>
                  <snm>Maere</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>De Bodt</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Raes</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Casneuf</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Van Montagu</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Kuiper</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Van de Peer</snm>
                  <fnm>Y</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2005</pubdate>
            <volume>102</volume>
            <fpage>5454</fpage>
            <lpage>5459</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">556253</pubid>
                  <pubid idtype="pmpid" link="fulltext">15800040</pubid>
                  <pubid idtype="doi">10.1073/pnas.0501102102</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B26">
            <title>
               <p>SL trans-splicing: easy come or easy go?</p>
            </title>
            <aug>
               <au>
                  <snm>Hastings</snm>
                  <fnm>KE</fnm>
               </au>
            </aug>
            <source>Trends Genet</source>
            <pubdate>2005</pubdate>
            <volume>21</volume>
            <fpage>240</fpage>
            <lpage>247</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.tig.2005.02.005</pubid>
                  <pubid idtype="pmpid" link="fulltext">15797620</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B27">
            <title>
               <p>Genome-wide transcription and the implications for genomic organization.</p>
            </title>
            <aug>
               <au>
                  <snm>Kapranov</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Willingham</snm>
                  <fnm>AT</fnm>
               </au>
               <au>
                  <snm>Gingeras</snm>
                  <fnm>TR</fnm>
               </au>
            </aug>
            <source>Nat Rev Genet</source>
            <pubdate>2007</pubdate>
            <volume>8</volume>
            <fpage>413</fpage>
            <lpage>423</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nrg2083</pubid>
                  <pubid idtype="pmpid" link="fulltext">17486121</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B28">
            <title>
               <p>Large-scale protein annotation through gene ontology.</p>
            </title>
            <aug>
               <au>
                  <snm>Xie</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Wasserman</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Levine</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Novik</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Grebinskiy</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Shoshan</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Mintz</snm>
                  <fnm>L</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2002</pubdate>
            <volume>12</volume>
            <fpage>785</fpage>
            <lpage>794</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">186564</pubid>
                  <pubid idtype="pmpid" link="fulltext">11997345</pubid>
                  <pubid idtype="doi">10.1101/gr.86902</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B29">
            <title>
               <p>A transcriptomic analysis of the phylum Nematoda.</p>
            </title>
            <aug>
               <au>
                  <snm>Parkinson</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Mitreva</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Whitton</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Thomson</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Daub</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Martin</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Schmid</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Hall</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Barrell</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Waterston</snm>
                  <fnm>RH</fnm>
               </au>
               <au>
                  <snm>McCarter</snm>
                  <fnm>JP</fnm>
               </au>
               <au>
                  <snm>Blaxter</snm>
                  <fnm>ML</fnm>
               </au>
            </aug>
            <source>Nat Genet</source>
            <pubdate>2004</pubdate>
            <volume>36</volume>
            <fpage>1259</fpage>
            <lpage>1267</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/ng1472</pubid>
                  <pubid idtype="pmpid" link="fulltext">15543149</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B30">
            <title>
               <p>Acoel flatworms are not platyhelminthes: evidence from phylogenomics.</p>
            </title>
            <aug>
               <au>
                  <snm>Philippe</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Brinkmann</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Martinez</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Riutort</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Bagu&#241;&#224;</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>PLoS ONE</source>
            <pubdate>2007</pubdate>
            <volume>2</volume>
            <fpage>e717</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1933604</pubid>
                  <pubid idtype="pmpid" link="fulltext">17684563</pubid>
                  <pubid idtype="doi">10.1371/journal.pone.0000717</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B31">
            <title>
               <p>Distribution of creatine, guanidinoacetate and the enzymes for their biosynthesis in the animal kingdom. Implications for phylogeny.</p>
            </title>
            <aug>
               <au>
                  <snm>Van Pilsum</snm>
                  <fnm>JF</fnm>
               </au>
               <au>
                  <snm>Stephens</snm>
                  <fnm>GC</fnm>
               </au>
               <au>
                  <snm>Taylor</snm>
                  <fnm>D</fnm>
               </au>
            </aug>
            <source>Biochem J</source>
            <pubdate>1972</pubdate>
            <volume>126</volume>
            <fpage>325</fpage>
            <lpage>345</lpage>
         </bibl>
         <bibl id="B32">
            <title>
               <p>Comparative genome and proteome analysis of <it>Anopheles gambiae </it>and <it>Drosophila melanogaster</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Zdobnov</snm>
                  <fnm>EM</fnm>
               </au>
               <au>
                  <snm>von Mering</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Letunic</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Torrents</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Suyama</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Copley</snm>
                  <fnm>RR</fnm>
               </au>
               <au>
                  <snm>Christophides</snm>
                  <fnm>GK</fnm>
               </au>
               <au>
                  <snm>Thomasova</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Holt</snm>
                  <fnm>RA</fnm>
               </au>
               <au>
                  <snm>Subramanian</snm>
                  <fnm>GM</fnm>
               </au>
               <au>
                  <snm>Mueller</snm>
                  <fnm>HM</fnm>
               </au>
               <au>
                  <snm>Dimopoulos</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Law</snm>
                  <fnm>JH</fnm>
               </au>
               <au>
                  <snm>Wells</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Birney</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Charlab</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Halpern</snm>
                  <fnm>AL</fnm>
               </au>
               <au>
                  <snm>Kokoza</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Kraft</snm>
                  <fnm>CL</fnm>
               </au>
               <au>
                  <snm>Lai</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Lewis</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Louis</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Barillas-Mury</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Nusskern</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Rubin</snm>
                  <fnm>GM</fnm>
               </au>
               <au>
                  <snm>Salzberg</snm>
                  <fnm>SL</fnm>
               </au>
               <au>
                  <snm>Sutton</snm>
                  <fnm>GG</fnm>
               </au>
               <au>
                  <snm>Topalis</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Wides</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Wincker</snm>
                  <fnm>P</fnm>
               </au>
               <etal/>
            </aug>
            <source>Science</source>
            <pubdate>2002</pubdate>
            <volume>298</volume>
            <fpage>149</fpage>
            <lpage>159</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.1077061</pubid>
                  <pubid idtype="pmpid" link="fulltext">12364792</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B33">
            <title>
               <p>Orthology, paralogy and proposed classification for paralog subtypes.</p>
            </title>
            <aug>
               <au>
                  <snm>Sonnhammer</snm>
                  <fnm>EL</fnm>
               </au>
               <au>
                  <snm>Koonin</snm>
                  <fnm>EV</fnm>
               </au>
            </aug>
            <source>Trends Genet</source>
            <pubdate>2002</pubdate>
            <volume>18</volume>
            <fpage>619</fpage>
            <lpage>620</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0168-9525(02)02793-2</pubid>
                  <pubid idtype="pmpid" link="fulltext">12446146</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B34">
            <title>
               <p>Deuterostome phylogeny reveals monophyletic chordates and the new phylum Xenoturbellida.</p>
            </title>
            <aug>
               <au>
                  <snm>Bourlat</snm>
                  <fnm>SJ</fnm>
               </au>
               <au>
                  <snm>Juliusdottir</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Lowe</snm>
                  <fnm>CJ</fnm>
               </au>
               <au>
                  <snm>Freeman</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Aronowicz</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Kirschner</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Lander</snm>
                  <fnm>ES</fnm>
               </au>
               <au>
                  <snm>Thorndyke</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Nakano</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Kohn</snm>
                  <fnm>AB</fnm>
               </au>
               <au>
                  <snm>Heyland</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Moroz</snm>
                  <fnm>LL</fnm>
               </au>
               <au>
                  <snm>Copley</snm>
                  <fnm>RR</fnm>
               </au>
               <au>
                  <snm>Telford</snm>
                  <fnm>MJ</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2006</pubdate>
            <volume>444</volume>
            <fpage>85</fpage>
            <lpage>88</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature05241</pubid>
                  <pubid idtype="pmpid" link="fulltext">17051155</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B35">
            <title>
               <p>Spiralian phylogenomics supports the resurrection of Bryozoa comprising Ectoprocta and Entoprocta.</p>
            </title>
            <aug>
               <au>
                  <snm>Hausdorf</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Helmkampf</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Meyer</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Witek</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Herlyn</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Bruchhaus</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Hankeln</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Struck</snm>
                  <fnm>TH</fnm>
               </au>
               <au>
                  <snm>Lieb</snm>
                  <fnm>B</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2007</pubdate>
            <volume>24</volume>
            <fpage>2723</fpage>
            <lpage>2729</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/molbev/msm214</pubid>
                  <pubid idtype="pmpid" link="fulltext">17921486</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B36">
            <title>
               <p>Phylogenetic position of Nemertea derived from phylogenomic data.</p>
            </title>
            <aug>
               <au>
                  <snm>Struck</snm>
                  <fnm>TH</fnm>
               </au>
               <au>
                  <snm>Fisse</snm>
                  <fnm>F</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2008</pubdate>
            <volume>25</volume>
            <fpage>728</fpage>
            <lpage>736</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/molbev/msn019</pubid>
                  <pubid idtype="pmpid" link="fulltext">18222945</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B37">
            <title>
               <p>Spliced leader RNA-mediated trans-splicing in phylum Rotifera.</p>
            </title>
            <aug>
               <au>
                  <snm>Pouchkina-Stantcheva</snm>
                  <fnm>NN</fnm>
               </au>
               <au>
                  <snm>Tunnacliffe</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2005</pubdate>
            <volume>22</volume>
            <fpage>1482</fpage>
            <lpage>1489</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/molbev/msi139</pubid>
                  <pubid idtype="pmpid" link="fulltext">15788744</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B38">
            <aug>
               <au>
                  <snm>Nielsen</snm>
                  <fnm>C</fnm>
               </au>
            </aug>
            <source>Animal Evolution: Interelationships of the Living Phyla</source>
            <publisher>New York: Oxford University Press</publisher>
            <pubdate>2001</pubdate>
         </bibl>
         <bibl id="B39">
            <title>
               <p>Triploblastic relationships with emphasis on the acoelomates and the position of Gnathostomulida, Cycliophora, Plathelminthes, and Chaetognatha: a combined approach of 18S rDNA sequences and morphology.</p>
            </title>
            <aug>
               <au>
                  <snm>Giribet</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Distel</snm>
                  <fnm>DL</fnm>
               </au>
               <au>
                  <snm>Polz</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Sterrer</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Wheeler</snm>
                  <fnm>WC</fnm>
               </au>
            </aug>
            <source>Syst Biol</source>
            <pubdate>2000</pubdate>
            <volume>49</volume>
            <fpage>539</fpage>
            <lpage>562</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1080/10635159950127385</pubid>
                  <pubid idtype="pmpid">12116426</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B40">
            <title>
               <p>The new view of animal phylogeny.</p>
            </title>
            <aug>
               <au>
                  <snm>Halanych</snm>
                  <fnm>KM</fnm>
               </au>
            </aug>
            <source>Annu Rev Ecol Evol Syst</source>
            <pubdate>2004</pubdate>
            <volume>35</volume>
            <fpage>229</fpage>
            <lpage>256</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1146/annurev.ecolsys.35.112202.130124</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B41">
            <title>
               <p>Lack of resolution in the animal phylogeny: closely spaced cladogeneses or undetected systematic errors?</p>
            </title>
            <aug>
               <au>
                  <snm>Baurain</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Brinkmann</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Philippe</snm>
                  <fnm>H</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2007</pubdate>
            <volume>24</volume>
            <fpage>6</fpage>
            <lpage>9</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/molbev/msl137</pubid>
                  <pubid idtype="pmpid" link="fulltext">17012374</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B42">
            <title>
               <p>Suppression of long-branch attraction artefacts in the animal phylogeny using a site-heterogeneous model.</p>
            </title>
            <aug>
               <au>
                  <snm>Lartillot</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Brinkmann</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Philippe</snm>
                  <fnm>H</fnm>
               </au>
            </aug>
            <source>BMC Evol Biol</source>
            <pubdate>2007</pubdate>
            <volume>7</volume>
            <issue>Suppl 1</issue>
            <fpage>S4</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1796613</pubid>
                  <pubid idtype="pmpid" link="fulltext">17288577</pubid>
                  <pubid idtype="doi">10.1186/1471-2148-7-S1-S4</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B43">
            <title>
               <p>Improvement of molecular phylogenetic inference and the phylogeny of Bilateria.</p>
            </title>
            <aug>
               <au>
                  <snm>Lartillot</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Philippe</snm>
                  <fnm>H</fnm>
               </au>
            </aug>
            <source>Philos Trans R Soc Lond B Biol Sci</source>
            <pubdate>2008</pubdate>
            <volume>363</volume>
            <fpage>1463</fpage>
            <lpage>1472</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid">18192187</pubid>
                  <pubid idtype="doi">10.1098/rstb.2007.2236</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B44">
            <title>
               <p>A site- and time-heterogeneous model of amino-acid replacement.</p>
            </title>
            <aug>
               <au>
                  <snm>Blanquart</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Lartillot</snm>
                  <fnm>N</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2008</pubdate>
            <volume>25</volume>
            <fpage>842</fpage>
            <lpage>858</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/molbev/msn018</pubid>
                  <pubid idtype="pmpid" link="fulltext">18234708</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B45">
            <title>
               <p>Mitochondrial genome of <it>Trichoplax adhaerens </it>supports placozoa as the basal lower metazoan phylum.</p>
            </title>
            <aug>
               <au>
                  <snm>Dellaporta</snm>
                  <fnm>SL</fnm>
               </au>
               <au>
                  <snm>Xu</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Sagasser</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Jakob</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Moreno</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Buss</snm>
                  <fnm>LW</fnm>
               </au>
               <au>
                  <snm>Schierwater</snm>
                  <fnm>B</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2006</pubdate>
            <volume>103</volume>
            <fpage>8751</fpage>
            <lpage>8756</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1470968</pubid>
                  <pubid idtype="pmpid" link="fulltext">16731622</pubid>
                  <pubid idtype="doi">10.1073/pnas.0602076103</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B46">
            <title>
               <p>My favorite animal, <it>Trichoplax adhaerens</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Schierwater</snm>
                  <fnm>B</fnm>
               </au>
            </aug>
            <source>Bioessays</source>
            <pubdate>2005</pubdate>
            <volume>27</volume>
            <fpage>1294</fpage>
            <lpage>1302</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1002/bies.20320</pubid>
                  <pubid idtype="pmpid" link="fulltext">16299758</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B47">
            <title>
               <p>Global trends of whole-genome duplications revealed by the ciliate <it>Paramecium tetraurelia</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Aury</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Jaillon</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Duret</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Noel</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Jubin</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Porcel</snm>
                  <fnm>BM</fnm>
               </au>
               <au>
                  <snm>S&#233;gurens</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Daubin</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Anthouard</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Aiach</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Arnaiz</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Billaut</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Beisson</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Blanc</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Bouhouche</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>C&#226;mara</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Duharcourt</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Guigo</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Gogendeau</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Katinka</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Keller</snm>
                  <fnm>AM</fnm>
               </au>
               <au>
                  <snm>Kissmehl</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Klotz</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Koll</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Le Mou&#235;l</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Lep&#232;re</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Malinsky</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Nowacki</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Nowak</snm>
                  <fnm>JK</fnm>
               </au>
               <au>
                  <snm>Plattner</snm>
                  <fnm>H</fnm>
               </au>
               <etal/>
            </aug>
            <source>Nature</source>
            <pubdate>2006</pubdate>
            <volume>444</volume>
            <fpage>171</fpage>
            <lpage>178</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature05230</pubid>
                  <pubid idtype="pmpid" link="fulltext">17086204</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B48">
            <title>
               <p>Functional divergence of duplicated genes formed by polyploidy during <it>Arabidopsis </it>evolution.</p>
            </title>
            <aug>
               <au>
                  <snm>Blanc</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Wolfe</snm>
                  <fnm>KH</fnm>
               </au>
            </aug>
            <source>Plant Cell</source>
            <pubdate>2004</pubdate>
            <volume>16</volume>
            <fpage>1679</fpage>
            <lpage>1691</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">514153</pubid>
                  <pubid idtype="pmpid" link="fulltext">15208398</pubid>
                  <pubid idtype="doi">10.1105/tpc.021410</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B49">
            <title>
               <p>Yeast genome evolution in the post-genome era.</p>
            </title>
            <aug>
               <au>
                  <snm>Seoighe</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Wolfe</snm>
                  <fnm>KH</fnm>
               </au>
            </aug>
            <source>Curr Opin Microbiol</source>
            <pubdate>1999</pubdate>
            <volume>2</volume>
            <fpage>548</fpage>
            <lpage>554</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S1369-5274(99)00015-6</pubid>
                  <pubid idtype="pmpid" link="fulltext">10508730</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B50">
            <title>
               <p>Preservation of duplicate genes by complementary, degenerative mutations.</p>
            </title>
            <aug>
               <au>
                  <snm>Force</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Lynch</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Pickett</snm>
                  <fnm>FB</fnm>
               </au>
               <au>
                  <snm>Amores</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Yan</snm>
                  <fnm>YL</fnm>
               </au>
               <au>
                  <snm>Postlethwait</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Genetics</source>
            <pubdate>1999</pubdate>
            <volume>151</volume>
            <fpage>1531</fpage>
            <lpage>1545</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1460548</pubid>
                  <pubid idtype="pmpid" link="fulltext">10101175</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B51">
            <title>
               <p>Major events in the genome evolution of vertebrates: paranome age and size differ considerably between ray-finned fishes and land vertebrates.</p>
            </title>
            <aug>
               <au>
                  <snm>Vandepoele</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>De Vos</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Taylor</snm>
                  <fnm>JS</fnm>
               </au>
               <au>
                  <snm>Meyer</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Van de Peer</snm>
                  <fnm>Y</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2004</pubdate>
            <volume>101</volume>
            <fpage>1638</fpage>
            <lpage>1643</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">341801</pubid>
                  <pubid idtype="pmpid" link="fulltext">14757817</pubid>
                  <pubid idtype="doi">10.1073/pnas.0307968100</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B52">
            <title>
               <p>Spatial and temporal genetic structure of the planktonic <it>Sagitta setosa </it>(Chaetognatha) in European seas as revealed by mitochondrial and nuclear DNA markers.</p>
            </title>
            <aug>
               <au>
                  <snm>Peijnenburg</snm>
                  <fnm>KT</fnm>
               </au>
               <au>
                  <snm>Fauvelot</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Breeuwer</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Menken</snm>
                  <fnm>SB</fnm>
               </au>
            </aug>
            <source>Mol Ecol</source>
            <pubdate>2006</pubdate>
            <volume>15</volume>
            <fpage>3319</fpage>
            <lpage>3338</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1111/j.1365-294X.2006.03002.x</pubid>
                  <pubid idtype="pmpid" link="fulltext">16968273</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B53">
            <title>
               <p>Mechanisms and consequences of somatic mosaicism in humans.</p>
            </title>
            <aug>
               <au>
                  <snm>Youssoufian</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Pyeritz</snm>
                  <fnm>RE</fnm>
               </au>
            </aug>
            <source>Nat Rev Genet</source>
            <pubdate>2002</pubdate>
            <volume>3</volume>
            <fpage>748</fpage>
            <lpage>758</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nrg906</pubid>
                  <pubid idtype="pmpid" link="fulltext">12360233</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B54">
            <title>
               <p>Costs and benefits of genetic heterogeneity within organisms.</p>
            </title>
            <aug>
               <au>
                  <snm>Pineda-Krch</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Lehtil&#228;</snm>
                  <fnm>K</fnm>
               </au>
            </aug>
            <source>J Evol Biol</source>
            <pubdate>2004</pubdate>
            <volume>17</volume>
            <fpage>1167</fpage>
            <lpage>1177</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1111/j.1420-9101.2004.00808.x</pubid>
                  <pubid idtype="pmpid" link="fulltext">15525396</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B55">
            <title>
               <p>A model system for analyzing somatic mutations in <it>Drosophila melanogaster</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Garcia</snm>
                  <fnm>AM</fnm>
               </au>
               <au>
                  <snm>Derventzi</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Busuttil</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Calder</snm>
                  <fnm>RB</fnm>
               </au>
               <au>
                  <snm>Perez</snm>
                  <fnm>E</fnm>
                  <suf>Jr</suf>
               </au>
               <au>
                  <snm>Chadwell</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Dolle</snm>
                  <fnm>ME</fnm>
               </au>
               <au>
                  <snm>Lundell</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Vijg</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Nat Methods</source>
            <pubdate>2007</pubdate>
            <volume>4</volume>
            <fpage>401</fpage>
            <lpage>403</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nmeth1052</pubid>
                  <pubid idtype="pmpid" link="fulltext">17435764</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B56">
            <title>
               <p>Principles of genome evolution in the <it>Drosophila melanogaster </it>species group.</p>
            </title>
            <aug>
               <au>
                  <snm>Ranz</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Maurin</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Chan</snm>
                  <fnm>YS</fnm>
               </au>
               <au>
                  <snm>von Grotthuss</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Hillier</snm>
                  <fnm>LW</fnm>
               </au>
               <au>
                  <snm>Roote</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Ashburner</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Bergman</snm>
                  <fnm>CM</fnm>
               </au>
            </aug>
            <source>PLoS Biol</source>
            <pubdate>2007</pubdate>
            <volume>5</volume>
            <fpage>e152</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1885836</pubid>
                  <pubid idtype="pmpid" link="fulltext">17550304</pubid>
                  <pubid idtype="doi">10.1371/journal.pbio.0050152</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B57">
            <title>
               <p>The power and promise of population genomics: from genotyping to genome typing.</p>
            </title>
            <aug>
               <au>
                  <snm>Luikart</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>England</snm>
                  <fnm>PR</fnm>
               </au>
               <au>
                  <snm>Tallmon</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Jordan</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Taberlet</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Nat Rev Genet</source>
            <pubdate>2003</pubdate>
            <volume>4</volume>
            <fpage>981</fpage>
            <lpage>994</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nrg1226</pubid>
                  <pubid idtype="pmpid" link="fulltext">14631358</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B58">
            <title>
               <p>Operon conservation and the evolution of trans-splicing in the phylum Nematoda.</p>
            </title>
            <aug>
               <au>
                  <snm>Guiliano</snm>
                  <fnm>DB</fnm>
               </au>
               <au>
                  <snm>Blaxter</snm>
                  <fnm>ML</fnm>
               </au>
            </aug>
            <source>PLoS Genet</source>
            <pubdate>2006</pubdate>
            <volume>2</volume>
            <fpage>e198</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1657053</pubid>
                  <pubid idtype="pmpid" link="fulltext">17121468</pubid>
                  <pubid idtype="doi">10.1371/journal.pgen.0020198</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B59">
            <title>
               <p><it>Caenorhabditis elegans </it>operons: form and function.</p>
            </title>
            <aug>
               <au>
                  <snm>Blumenthal</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Gleason</snm>
                  <fnm>KS</fnm>
               </au>
            </aug>
            <source>Nat Rev Genet</source>
            <pubdate>2003</pubdate>
            <volume>4</volume>
            <fpage>112</fpage>
            <lpage>120</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nrg995</pubid>
                  <pubid idtype="pmpid" link="fulltext">12560808</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B60">
            <title>
               <p>Gene linkage and steady state RNAs suggest trans-splicing may be associated with a polycistronic transcript in <it>Schistosoma mansoni</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Davis</snm>
                  <fnm>RE</fnm>
               </au>
               <au>
                  <snm>Hodgson</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>Mol Biochem Parasitol</source>
            <pubdate>1997</pubdate>
            <volume>89</volume>
            <fpage>25</fpage>
            <lpage>39</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0166-6851(97)00097-2</pubid>
                  <pubid idtype="pmpid" link="fulltext">9297698</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B61">
            <title>
               <p>Genomic overview of mRNA 5'-leader trans-splicing in the ascidian <it>Ciona intestinalis</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Satou</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Hamaguchi</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Takeuchi</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Hastings</snm>
                  <fnm>KE</fnm>
               </au>
               <au>
                  <snm>Satoh</snm>
                  <fnm>N</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2006</pubdate>
            <volume>34</volume>
            <fpage>3378</fpage>
            <lpage>3388</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1488885</pubid>
                  <pubid idtype="pmpid" link="fulltext">16822859</pubid>
                  <pubid idtype="doi">10.1093/nar/gkl418</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B62">
            <title>
               <p>Spliced-leader trans-splicing in freshwater planarians.</p>
            </title>
            <aug>
               <au>
                  <snm>Zayas</snm>
                  <fnm>RM</fnm>
               </au>
               <au>
                  <snm>Bold</snm>
                  <fnm>TD</fnm>
               </au>
               <au>
                  <snm>Newmark</snm>
                  <fnm>PA</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2005</pubdate>
            <volume>22</volume>
            <fpage>2048</fpage>
            <lpage>2054</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/molbev/msi200</pubid>
                  <pubid idtype="pmpid" link="fulltext">15972844</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B63">
            <title>
               <p>Animal Genome Size Database</p>
            </title>
            <url>http://www.genomesize.com</url>
         </bibl>
         <bibl id="B64">
            <title>
               <p>Vertebrate-type intron-rich genes in the marine annelid <it>Platynereis dumerilii</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Raible</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Tessmar-Raible</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Osoegawa</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Wincker</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Jubin</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Balavoine</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Ferrier</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Benes</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>de Jong</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Weissenbach</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Bork</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Arendt</snm>
                  <fnm>D</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2005</pubdate>
            <volume>310</volume>
            <fpage>1325</fpage>
            <lpage>1326</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.1119089</pubid>
                  <pubid idtype="pmpid" link="fulltext">16311335</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B65">
            <title>
               <p>Duplication and divergence: the evolution of new genes and old ideas.</p>
            </title>
            <aug>
               <au>
                  <snm>Taylor</snm>
                  <fnm>JS</fnm>
               </au>
               <au>
                  <snm>Raes</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Annu Rev Genet</source>
            <pubdate>2004</pubdate>
            <volume>38</volume>
            <fpage>615</fpage>
            <lpage>643</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1146/annurev.genet.38.072902.092831</pubid>
                  <pubid idtype="pmpid" link="fulltext">15568988</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B66">
            <title>
               <p>Natural history and evolutionary principles of gene duplication in fungi.</p>
            </title>
            <aug>
               <au>
                  <snm>Wapinski</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Pfeffer</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Friedman</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Regev</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2007</pubdate>
            <volume>449</volume>
            <fpage>54</fpage>
            <lpage>61</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature06107</pubid>
                  <pubid idtype="pmpid" link="fulltext">17805289</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B67">
            <title>
               <p>Molecular architecture of annelid nerve cord supports common origin of nervous system centralization in bilateria.</p>
            </title>
            <aug>
               <au>
                  <snm>Denes</snm>
                  <fnm>AS</fnm>
               </au>
               <au>
                  <snm>J&#233;kely</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Steinmetz</snm>
                  <fnm>PR</fnm>
               </au>
               <au>
                  <snm>Raible</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Snyman</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Prud'homme</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Ferrier</snm>
                  <fnm>DE</fnm>
               </au>
               <au>
                  <snm>Balavoine</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Arendt</snm>
                  <fnm>D</fnm>
               </au>
            </aug>
            <source>Cell</source>
            <pubdate>2007</pubdate>
            <volume>129</volume>
            <fpage>277</fpage>
            <lpage>288</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.cell.2007.02.040</pubid>
                  <pubid idtype="pmpid" link="fulltext">17448990</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B68">
            <title>
               <p>Gapped BLAST and PSI-BLAST: a new generation of protein database search programs.</p>
            </title>
            <aug>
               <au>
                  <snm>Altschul</snm>
                  <fnm>SF</fnm>
               </au>
               <au>
                  <snm>Madden</snm>
                  <fnm>TL</fnm>
               </au>
               <au>
                  <snm>Sch&#228;ffer</snm>
                  <fnm>AA</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Miller</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Lipman</snm>
                  <fnm>DJ</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>1997</pubdate>
            <volume>25</volume>
            <fpage>3389</fpage>
            <lpage>3402</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">146917</pubid>
                  <pubid idtype="pmpid" link="fulltext">9254694</pubid>
                  <pubid idtype="doi">10.1093/nar/25.17.3389</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B69">
            <title>
               <p>Modeling sequencing errors by combining hidden Markov models.</p>
            </title>
            <aug>
               <au>
                  <snm>Lottaz</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Iseli</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Jongeneel</snm>
                  <fnm>CV</fnm>
               </au>
               <au>
                  <snm>Bucher</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>2003</pubdate>
            <volume>19</volume>
            <issue>Suppl 2</issue>
            <fpage>ii103</fpage>
            <lpage>ii112</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">14534179</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B70">
            <title>
               <p>Making sense of EST sequences by CLOBBing them.</p>
            </title>
            <aug>
               <au>
                  <snm>Parkinson</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Guiliano</snm>
                  <fnm>DB</fnm>
               </au>
               <au>
                  <snm>Blaxter</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>BMC Bioinformatics</source>
            <pubdate>2002</pubdate>
            <volume>3</volume>
            <fpage>31</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">137596</pubid>
                  <pubid idtype="pmpid" link="fulltext">12398795</pubid>
                  <pubid idtype="doi">10.1186/1471-2105-3-31</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B71">
            <title>
               <p>FatiGO: a web tool for finding significant associations of Gene Ontology terms with groups of genes.</p>
            </title>
            <aug>
               <au>
                  <snm>Al-Shahrour</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Diaz-Uriarte</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Dopazo</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>2004</pubdate>
            <volume>20</volume>
            <fpage>578</fpage>
            <lpage>580</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/bioinformatics/btg455</pubid>
                  <pubid idtype="pmpid" link="fulltext">14990455</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B72">
            <title>
               <p>The Bioperl toolkit: Perl modules for the life sciences.</p>
            </title>
            <aug>
               <au>
                  <snm>Stajich</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Block</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Boulez</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Brenner</snm>
                  <fnm>SE</fnm>
               </au>
               <au>
                  <snm>Chervitz</snm>
                  <fnm>SA</fnm>
               </au>
               <au>
                  <snm>Dagdigian</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Fuellen</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Gilbert</snm>
                  <fnm>JG</fnm>
               </au>
               <au>
                  <snm>Korf</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Lapp</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Lehvaslaiho</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Matsalla</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Mungall</snm>
                  <fnm>CJ</fnm>
               </au>
               <au>
                  <snm>Osborne</snm>
                  <fnm>BI</fnm>
               </au>
               <au>
                  <snm>Pocock</snm>
                  <fnm>MR</fnm>
               </au>
               <au>
                  <snm>Schattner</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Senger</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Stein</snm>
                  <fnm>LD</fnm>
               </au>
               <au>
                  <snm>Stupka</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Wilkinson</snm>
                  <fnm>MD</fnm>
               </au>
               <au>
                  <snm>Birney</snm>
                  <fnm>E</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2002</pubdate>
            <volume>12</volume>
            <fpage>1611</fpage>
            <lpage>1618</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">187536</pubid>
                  <pubid idtype="pmpid" link="fulltext">12368254</pubid>
                  <pubid idtype="doi">10.1101/gr.361602</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B73">
            <title>
               <p>Ensembl Genome Browser</p>
            </title>
            <url>http://www.ensembl.org</url>
         </bibl>
         <bibl id="B74">
            <title>
               <p>NCBI EST Database (dbEST)</p>
            </title>
            <url>http://www.ncbi.nlm.nih.gov/dbEST</url>
         </bibl>
         <bibl id="B75">
            <title>
               <p>JGI Eukaryotic Genomics</p>
            </title>
            <url>http://genome.jgi-psf.org</url>
         </bibl>
         <bibl id="B76">
            <title>
               <p>NCBI Trace Archive</p>
            </title>
            <url>http://www.ncbi.nlm.nih.gov/Traces</url>
         </bibl>
         <bibl id="B77">
            <title>
               <p>SimiTri--visualizing similarity relationships for groups of sequences.</p>
            </title>
            <aug>
               <au>
                  <snm>Parkinson</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Blaxter</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>2003</pubdate>
            <volume>19</volume>
            <fpage>390</fpage>
            <lpage>395</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/bioinformatics/btf870</pubid>
                  <pubid idtype="pmpid" link="fulltext">12584125</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B78">
            <title>
               <p>PAML 4: Phylogenetic Analysis by Maximum Likelihood.</p>
            </title>
            <aug>
               <au>
                  <snm>Yang</snm>
                  <fnm>Z</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2007</pubdate>
            <volume>24</volume>
            <fpage>1586</fpage>
            <lpage>1591</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/molbev/msm088</pubid>
                  <pubid idtype="pmpid" link="fulltext">17483113</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B79">
            <title>
               <p>A Bayesian mixture model for across-site heterogeneities in the amino-acid replacement process.</p>
            </title>
            <aug>
               <au>
                  <snm>Lartillot</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Philippe</snm>
                  <fnm>H</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2004</pubdate>
            <volume>21</volume>
            <fpage>1095</fpage>
            <lpage>1109</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/molbev/msh112</pubid>
                  <pubid idtype="pmpid" link="fulltext">15014145</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B80">
            <title>
               <p>A simple, fast, and accurate algorithm to estimate large phylogenies by maximum likelihood.</p>
            </title>
            <aug>
               <au>
                  <snm>Guindon</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Gascuel</snm>
                  <fnm>O</fnm>
               </au>
            </aug>
            <source>Syst Biol</source>
            <pubdate>2003</pubdate>
            <volume>52</volume>
            <fpage>696</fpage>
            <lpage>704</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1080/10635150390235520</pubid>
                  <pubid idtype="pmpid">14530136</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B81">
            <title>
               <p>TREEFINDER: a powerful graphical analysis environment for molecular phylogenetics.</p>
            </title>
            <aug>
               <au>
                  <snm>Jobb</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>von Haeseler</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Strimmer</snm>
                  <fnm>K</fnm>
               </au>
            </aug>
            <source>BMC Evol Biol</source>
            <pubdate>2004</pubdate>
            <volume>4</volume>
            <fpage>18</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">459214</pubid>
                  <pubid idtype="pmpid" link="fulltext">15222900</pubid>
                  <pubid idtype="doi">10.1186/1471-2148-4-18</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B82">
            <title>
               <p>MrBayes 3: Bayesian phylogenetic inference under mixed models.</p>
            </title>
            <aug>
               <au>
                  <snm>Ronquist</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Huelsenbeck</snm>
                  <fnm>JP</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>2003</pubdate>
            <volume>19</volume>
            <fpage>1572</fpage>
            <lpage>1574</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/bioinformatics/btg180</pubid>
                  <pubid idtype="pmpid" link="fulltext">12912839</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B83">
            <title>
               <p>MEGA2: molecular evolutionary genetics analysis software.</p>
            </title>
            <aug>
               <au>
                  <snm>Kumar</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Tamura</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Jakobsen</snm>
                  <fnm>IB</fnm>
               </au>
               <au>
                  <snm>Nei</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>2001</pubdate>
            <volume>17</volume>
            <fpage>1244</fpage>
            <lpage>1245</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/bioinformatics/17.12.1244</pubid>
                  <pubid idtype="pmpid" link="fulltext">11751241</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B84">
            <title>
               <p>DnaSP, DNA polymorphism analyses by the coalescent and other methods.</p>
            </title>
            <aug>
               <au>
                  <snm>Rozas</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>S&#225;nchez-DelBarrio</snm>
                  <fnm>JC</fnm>
               </au>
               <au>
                  <snm>Messeguer</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Rozas</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>2003</pubdate>
            <volume>19</volume>
            <fpage>2496</fpage>
            <lpage>2497</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/bioinformatics/btg359</pubid>
                  <pubid idtype="pmpid" link="fulltext">14668244</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B85">
            <title>
               <p>Trans-spliced leader addition to mRNAs in a cnidarian.</p>
            </title>
            <aug>
               <au>
                  <snm>Stover</snm>
                  <fnm>NA</fnm>
               </au>
               <au>
                  <snm>Steele</snm>
                  <fnm>RE</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2001</pubdate>
            <volume>98</volume>
            <fpage>5693</fpage>
            <lpage>5698</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">33275</pubid>
                  <pubid idtype="pmpid" link="fulltext">11331766</pubid>
                  <pubid idtype="doi">10.1073/pnas.101049998</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
      </refgrp>
   </bm>
</art>

