<?xml version='1.0'?>
<!DOCTYPE art SYSTEM 'http://www.biomedcentral.com/xml/article.dtd'>
<art>
   <ui>gb-2009-10-10-r111</ui>
   <ji>GBJ</ji>
   <fm>
      <dochead>Research</dochead>
      <bibl>
         <title>
            <p>Genome-wide comparative analysis of the <it>Brassica rapa </it>gene space reveals genome shrinkage and differential loss of duplicated genes after whole genome triplication</p>
         </title>
         <aug>
            <au id="A1">
               <snm>Mun</snm>
               <fnm>Jeong-Hwan</fnm>
               <insr iid="I1"/>
               <email>munjh@rda.go.kr</email>
            </au>
            <au id="A2">
               <snm>Kwon</snm>
               <fnm>Soo-Jin</fnm>
               <insr iid="I1"/>
               <email>sjkwon@rda.go.kr</email>
            </au>
            <au id="A3">
               <snm>Yang</snm>
               <fnm>Tae-Jin</fnm>
               <insr iid="I2"/>
               <email>tjyang@snu.ac.kr</email>
            </au>
            <au id="A4">
               <snm>Seol</snm>
               <fnm>Young-Joo</fnm>
               <insr iid="I1"/>
               <email>yseol@rda.go.kr</email>
            </au>
            <au id="A5">
               <snm>Jin</snm>
               <fnm>Mina</fnm>
               <insr iid="I1"/>
               <email>genemina@rda.go.kr</email>
            </au>
            <au id="A6">
               <snm>Kim</snm>
               <fnm>Jin-A</fnm>
               <insr iid="I1"/>
               <email>jakim@rda.go.kr</email>
            </au>
            <au id="A7">
               <snm>Lim</snm>
               <fnm>Myung-Ho</fnm>
               <insr iid="I1"/>
               <email>mlim312@rda.go.kr</email>
            </au>
            <au id="A8">
               <snm>Kim</snm>
               <fnm>Jung Sun</fnm>
               <insr iid="I1"/>
               <email>jsnkim@rda.go.kr</email>
            </au>
            <au id="A9">
               <snm>Baek</snm>
               <fnm>Seunghoon</fnm>
               <insr iid="I1"/>
               <email>yohan_bosco@hotmail.com</email>
            </au>
            <au id="A10">
               <snm>Choi</snm>
               <fnm>Beom-Soon</fnm>
               <insr iid="I3"/>
               <email>bschoi@nicem.snu.ac.kr</email>
            </au>
            <au id="A11">
               <snm>Yu</snm>
               <fnm>Hee-Ju</fnm>
               <insr iid="I4"/>
               <email>yuheeju@rda.go.kr</email>
            </au>
            <au id="A12">
               <snm>Kim</snm>
               <fnm>Dae-Soo</fnm>
               <insr iid="I5"/>
               <email>kds2465@kribb.re.kr</email>
            </au>
            <au id="A13">
               <snm>Kim</snm>
               <fnm>Namshin</fnm>
               <insr iid="I5"/>
               <email>n@rna.kr</email>
            </au>
            <au id="A14">
               <snm>Lim</snm>
               <fnm>Ki-Byung</fnm>
               <insr iid="I6"/>
               <email>kblim@knu.ac.kr</email>
            </au>
            <au id="A15">
               <snm>Lee</snm>
               <fnm>Soo-In</fnm>
               <insr iid="I1"/>
               <email>silee@rda.go.kr</email>
            </au>
            <au id="A16">
               <snm>Hahn</snm>
               <fnm>Jang-Ho</fnm>
               <insr iid="I1"/>
               <email>jhhahn@rda.go.kr</email>
            </au>
            <au id="A17">
               <snm>Lim</snm>
               <fnm>Yong Pyo</fnm>
               <insr iid="I7"/>
               <email>yplim@cnu.ac.kr</email>
            </au>
            <au id="A18">
               <snm>Bancroft</snm>
               <fnm>Ian</fnm>
               <insr iid="I8"/>
               <email>ian.bancroft@bbsrc.ac.uk</email>
            </au>
            <au ca="yes" id="A19">
               <snm>Park</snm>
               <fnm>Beom-Seok</fnm>
               <insr iid="I1"/>
               <email>pbeom@rda.go.kr</email>
            </au>
         </aug>
         <insg>
            <ins id="I1">
               <p>Department of Agricultural Biotechnology, National Academy of Agricultural Science, Rural Development Administration, 150 Suin-ro, Gwonseon-gu, Suwon 441-707, Korea</p>
            </ins>
            <ins id="I2">
               <p>Department of Plant Science College of Agriculture and Life Sciences, Seoul National University, San 56-1, Sillim-dong, Gwanak-gu, Seoul 151-921, Korea</p>
            </ins>
            <ins id="I3">
               <p>National Instrumentation Center for Environmental Management, College of Agriculture and Life Sciences, Seoul National University, San 56-1, Sillim-dong, Gwanak-gu, Seoul 151-921, Korea</p>
            </ins>
            <ins id="I4">
               <p>Vegetable Research Division, National Institute of Horticultural and Herbal Science, Rural Development Administration, Tap-dong 540-41, Gwonseon-gu, Suwon 441-440, Korea</p>
            </ins>
            <ins id="I5">
               <p>Korea Research Institute of Bioscience and Biotechnology, 111 Gwahangno, Yuseong-gu, Daejeon 305-806, Korea</p>
            </ins>
            <ins id="I6">
               <p>School of Applied Biosciences, College of Agriculture and Life Sciences, Kyungpook National University, Daegu 702-701, Korea</p>
            </ins>
            <ins id="I7">
               <p>Department of Horticulture, Chungnam National University, 220 Kung-dong, Yusong-gu, Daejon 305-764, Korea</p>
            </ins>
            <ins id="I8">
               <p>John Innes Centre, Norwich Research Centre, Colney, Norwich NR4 7UH, UK</p>
            </ins>
         </insg>
         <source>Genome Biology</source>
         <issn>1465-6906</issn>
         <pubdate>2009</pubdate>
         <volume>10</volume>
         <issue>10</issue>
         <fpage>R111</fpage>
         <url>http://genomebiology.com/2009/10/10/R111</url>
         <xrefbib>
            <pubidlist>
               <pubid idtype="doi">10.1186/gb-2009-10-10-r111</pubid>
               <pubid idtype="pmpid">19821981</pubid>
            </pubidlist>
         </xrefbib>
      </bibl>
      <history>
         <rec>
            <date>
               <day>18</day>
               <month>5</month>
               <year>2009</year>
            </date>
         </rec>
         <revrec>
            <date>
               <day>9</day>
               <month>8</month>
               <year>2009</year>
            </date>
         </revrec>
         <acc>
            <date>
               <day>12</day>
               <month>10</month>
               <year>2009</year>
            </date>
         </acc>
         <pub>
            <date>
               <day>12</day>
               <month>10</month>
               <year>2009</year>
            </date>
         </pub>
      </history>
      <cpyrt>
         <year>2009</year>
         <collab>Mun et al.; licensee BioMed Central Ltd.</collab>
         <note>This is an open access article distributed under the terms of the Creative Commons Attribution License (<url>http://creativecommons.org/licenses/by/2.0</url>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited</note>
      </cpyrt>
      <shorttitle>
         <p>Brassica rapa genome</p>
      </shorttitle>
      <shortabs>
         <p>Euchromatic regions of the Brassica rapa genome were sequenced and mapped onto the corresponding regions in the Arabidopsis thaliana genome.</p>
      </shortabs>
      <abs>
         <sec>
            <st>
               <p>Abstract</p>
            </st>
            <sec>
               <st>
                  <p>Background</p>
               </st>
               <p><it>Brassica rapa </it>is one of the most economically important vegetable crops worldwide. Owing to its agronomic importance and phylogenetic position, <it>B. rapa </it>provides a crucial reference to understand polyploidy-related crop genome evolution. The high degree of sequence identity and remarkably conserved genome structure between <it>Arabidopsis </it>and <it>Brassica </it>genomes enables comparative tiling sequencing using <it>Arabidopsis </it>sequences as references to select the counterpart regions in <it>B. rapa</it>, which is a strong challenge of structural and comparative crop genomics.</p>
            </sec>
            <sec>
               <st>
                  <p>Results</p>
               </st>
               <p>We assembled 65.8 megabase-pairs of non-redundant euchromatic sequence of <it>B. rapa </it>and compared this sequence to the <it>Arabidopsis </it>genome to investigate chromosomal relationships, macrosynteny blocks, and microsynteny within blocks. The triplicated <it>B. rapa </it>genome contains only approximately twice the number of genes as in <it>Arabidopsis </it>because of genome shrinkage. Genome comparisons suggest that <it>B. rapa </it>has a distinct organization of ancestral genome blocks as a result of recent whole genome triplication followed by a unique diploidization process. A lack of the most recent whole genome duplication (3R) event in the <it>B. rapa </it>genome, atypical of other <it>Brassica </it>genomes, may account for the emergence of <it>B. rapa </it>from the <it>Brassica </it>progenitor around 8 million years ago.</p>
            </sec>
            <sec>
               <st>
                  <p>Conclusions</p>
               </st>
               <p>This work demonstrates the potential of using comparative tiling sequencing for genome analysis of crop species. Based on a comparative analysis of the <it>B. rapa </it>sequences and the <it>Arabidopsis </it>genome, it appears that polyploidy and chromosomal diploidization are ongoing processes that collectively stabilize the <it>B. rapa </it>genome and facilitate its evolution.</p>
            </sec>
         </sec>
      </abs>
   </fm>
   <meta>
      <classifications>
         <classification type="BMC" subtype="man_spc_id" id="30010008">Evolution</classification>
         <classification type="BMC" subtype="man_spc_id" id="30010010">Genome studies</classification>
         <classification type="BMC" subtype="man_spc_id" id="30010015">Model organisms</classification>
         <classification type="BMC" subtype="man_spc_id" id="30010019">Plant biology</classification>
      </classifications>
   </meta>
   <bdy>
      <sec>
         <st>
            <p>Background</p>
         </st>
         <p>Flowering plants (angiosperms) have evolved in genome size since their sudden appearance in the fossil records of the late Jurassic/early Cretaceous period <abbrgrp><abbr bid="B1">1</abbr><abbr bid="B2">2</abbr><abbr bid="B3">3</abbr><abbr bid="B4">4</abbr></abbrgrp>. The genome expansion seen in angiosperms is mainly attributable to occasional polyploidy. Estimation of polyploidy levels in angiosperms indicates that the genomes of most (>90%) extant angiosperms, including many crops and all the plant model species sequenced thus far, have experienced one or more episodes of genome doubling at some point in their evolutionary history <abbrgrp><abbr bid="B5">5</abbr><abbr bid="B6">6</abbr></abbrgrp>. The accumulation of transposable elements (TEs) has been another prevalent factor in plant genome expansion. Recent studies on maize, rice, legumes, and cotton have demonstrated that the genome sizes of these crop species have increased significantly due to the accumulation and/or retention of TEs (mainly long terminal repeat retrotransposons (LTRs)) over the past few million years; the percentage of the genome made up of transposons is estimated to be between 35% and 52% based on sequenced genomes <abbrgrp><abbr bid="B7">7</abbr><abbr bid="B8">8</abbr><abbr bid="B9">9</abbr><abbr bid="B10">10</abbr><abbr bid="B11">11</abbr><abbr bid="B12">12</abbr></abbrgrp>. However, genome expansion is not a one-way process in plant genome evolution. Functional diversification or stochastic deletion of redundant genes by accumulation of mutations in polyploid genomes and removal of LTRs via illegitimate or intra-strand recombination can result in downsizing of the genome <abbrgrp><abbr bid="B13">13</abbr><abbr bid="B14">14</abbr><abbr bid="B15">15</abbr></abbrgrp>. Nevertheless, neither of the aforementioned mechanisms has been demonstrated to occur frequently enough to balance genome size growth, and plant genomes tend, therefore, to expand over time.</p>
         <p>The progress in whole genome sequencing of model genomes presents an important challenge in plant genomics: to apply the knowledge gained from the study of model genomes to biological and agronomical questions of importance in crop species. Comparative structural genomics is a well-established strategy in applied agriculture in several plant families. However, comparative analyses of modern angiosperm genomes, which have experienced multiple rounds of polyploidy followed by differential loss of redundant sequences, genome recombination, or invasion of LTRs, are characterized by interrupted synteny with only partial gene orthology even between closely related species, such as cereals <abbrgrp><abbr bid="B16">16</abbr></abbrgrp>, legumes <abbrgrp><abbr bid="B17">17</abbr><abbr bid="B18">18</abbr></abbrgrp>, and <it>Brassica </it>species <abbrgrp><abbr bid="B19">19</abbr><abbr bid="B20">20</abbr></abbrgrp>. Furthermore, functional divergence of duplicated genes limits interpretation of function based on orthology, which complicates knowledge transfer from model to crop plants. Thus, better delimitation of comparative genome arrangements reflecting evolutionary history will allow information obtained from fully sequenced model genomes to be used to target syntenic regions of interest and to infer parallel or convergent evolution of homologs important to biological and agronomical questions in closely related crop genomes.</p>
         <p>The mustard family (Brassicaceae or Cruciferae), the fifth largest monophyletic angiosperm family, consists of 338 genera and approximately 3,700 species in 25 tribes <abbrgrp><abbr bid="B21">21</abbr></abbrgrp>, and is fundamentally important to agriculture and the environment, accounting for approximately 10% of the world's vegetable crop produce and serving as a major source of edible oil and biofuel <abbrgrp><abbr bid="B22">22</abbr></abbrgrp>. Brassicaceae includes two important model systems: <it>Arabidopsis thaliana </it>(<it>At</it>), the most scientifically important plant model system for which complete genome sequence information is available, and the closely related, agriculturally important <it>Brassica </it>complex - <it>B. rapa </it>(<it>Br</it>, A genome), <it>B. nigra </it>(<it>Bn</it>, B genome), <it>B. oleracea </it>(<it>Bo</it>, C genome), and their three allopolyploids, <it>B. napus </it>(<it>Bna</it>, AC genome), <it>B. juncea </it>(<it>Bj</it>, AB genome), and <it>B. carinata </it>(<it>Bc</it>, BC genome). Syntenic relationships and polyploidy history in these two model systems have been investigated, although details about macro- and microsyntenic relationships between <it>At </it>and <it>Brassica </it>are limited and fragmented. Previous studies demonstrated broad-range chromosome correspondence between the <it>At </it>and <it>Brassica </it>genomes <abbrgrp><abbr bid="B23">23</abbr><abbr bid="B24">24</abbr></abbrgrp>, and a few studies have demonstrated specific cases of conservation of gene content and order with frequent disruption by interspersed gene loss and genome recombination <abbrgrp><abbr bid="B19">19</abbr><abbr bid="B20">20</abbr></abbrgrp>. Although this issue is contentious, there is evidence that Brassicaceae genomes have undergone three rounds of whole genome duplication (WGD; hereafter referred to as 1R, 2R, and 3R, which are equivalent to the &#947;, &#946;, and &#945; duplication events) <abbrgrp><abbr bid="B5">5</abbr><abbr bid="B25">25</abbr><abbr bid="B26">26</abbr></abbrgrp>. One profound finding from comparative analyses is the triplicate nature of the <it>Brassica </it>genome, indicating the occurrence of a whole genome triplication event (WGT, 4R) soon after divergence from the <it>At </it>lineage approximately 17 to 20 million years ago (MYA) <abbrgrp><abbr bid="B19">19</abbr><abbr bid="B20">20</abbr><abbr bid="B26">26</abbr></abbrgrp>. This result strongly suggests that comparative genomic analyses using single gene-specific amplicons or those based on small scale synteny comparisons will fail to identify all related genome segments, and thus not be able to provide accurate indications of orthology between the <it>At </it>and <it>Brassica </it>genomes. However, obtaining sufficient sequence information from <it>Brassica </it>genomes to identify genome-wide orthologous relationships between the <it>At </it>and <it>Brassica </it>genomes is a major challenge.</p>
         <p><it>Br </it>was recently chosen as a model species representing the <it>Brassica </it>'A' genome for genome sequencing <abbrgrp><abbr bid="B27">27</abbr><abbr bid="B28">28</abbr></abbrgrp>. This species was selected because it has already proved a useful model for studying polyploidy and because it has a relatively small (approximately 529 megabase-pair (Mbp)) but compact genome with genes concentrated in euchromatic spaces. However, widespread repetitive sequences in the <it>Br </it>genome hinder direct application of whole genome shotgun sequencing. Instead, targeted sequencing of specific regions of the <it>Br </it>genome could be informed by the reference <it>At </it>genome by selecting genomic clones based on sequence similarity; this approach is referred to as comparative tiling <abbrgrp><abbr bid="B29">29</abbr></abbrgrp>. Here, we report sequencing of large-scale regions of the <it>Br </it>euchromatic genome, covering almost all of the <it>At </it>euchromatic regions, obtained using the comparative tiling method. We performed a genome-wide sequence comparison of <it>Br </it>and <it>At </it>and analyzed the number of substitutions per synonymous site (Ks) between the two genomes and among related <it>Brassica </it>sequences to identify syntenic relationships and to further refine our understanding of the evolution of polyploidy. We also investigated genome microstructure conservation between the two genomes. In this study, we provide a foundation to reconstruct both the ancestral genome of the <it>Brassica </it>progenitor and the evolutionary history of the <it>Brassica </it>lineage, which we anticipate will provide a robust model for <it>Brassica </it>genomic studies and facilitate the investigation of the genome evolution of domesticated crop species.</p>
      </sec>
      <sec>
         <st>
            <p>Results</p>
         </st>
         <sec>
            <st>
               <p>Generation of <it>Br </it>euchromatic sequence contigs and genome coverage</p>
            </st>
            <p>Bacterial artificial chromosome (BAC) sequence assembly generated 410 <it>Br </it>sequence contigs (sequences composed of more than one BAC sequence) covering 65.8 Mbp (Tables S1 and S2 in Additional data file 1). These sequence contigs span 75.3 Mbp of the <it>At </it>genome, representing 92.2% of the total <it>At </it>euchromatic region (Figure <figr fid="F1">1</figr> and Table <tblr tid="T1">1</tblr>). A total of 43.9 Mbp remain as uncovered gaps: among these, 6.4 Mbp are attributable to euchromatin gaps, and the remaining 37.5 Mbp to pericentromeric heterochromatin gaps.</p>
            <tbl id="T1">
               <title>
                  <p>Table 1</p>
               </title>
               <caption>
                  <p>Summary of <it>B. rapa </it>chromosome sequences comparatively tiled on the <it>A. thaliana </it>genome</p>
               </caption>
               <tblbdy cols="7">
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c cspan="6" ca="center">
                        <p>
                           <b>
                              <it>B. rapa</it>
                           </b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c cspan="6">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b><it>A</it>. <it>thaliana</it></b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Number of BACs</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Number of sequence contigs</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Total sequence length (Mbp)</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Coverage of <it>At </it>genome (Mbp)</b>
                        </p>
                     </c>
                     <c cspan="2" ca="center">
                        <p>
                           <b>Gaps of <it>At </it>genome (Mbp)</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c cspan="2">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Euchromatin</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Heterochromatin</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c cspan="7">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>At1</p>
                     </c>
                     <c ca="center">
                        <p>147</p>
                     </c>
                     <c ca="center">
                        <p>105</p>
                     </c>
                     <c ca="center">
                        <p>16.5</p>
                     </c>
                     <c ca="center">
                        <p>18.5</p>
                     </c>
                     <c ca="center">
                        <p>1.4</p>
                     </c>
                     <c ca="center">
                        <p>10.5</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>At2</p>
                     </c>
                     <c ca="center">
                        <p>98</p>
                     </c>
                     <c ca="center">
                        <p>59</p>
                     </c>
                     <c ca="center">
                        <p>10.3</p>
                     </c>
                     <c ca="center">
                        <p>12.4</p>
                     </c>
                     <c ca="center">
                        <p>1.4</p>
                     </c>
                     <c ca="center">
                        <p>6</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>At3</p>
                     </c>
                     <c ca="center">
                        <p>124</p>
                     </c>
                     <c ca="center">
                        <p>89</p>
                     </c>
                     <c ca="center">
                        <p>14.2</p>
                     </c>
                     <c ca="center">
                        <p>15.7</p>
                     </c>
                     <c ca="center">
                        <p>0.4</p>
                     </c>
                     <c ca="center">
                        <p>7.4</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>At4</p>
                     </c>
                     <c ca="center">
                        <p>97</p>
                     </c>
                     <c ca="center">
                        <p>73</p>
                     </c>
                     <c ca="center">
                        <p>11.3</p>
                     </c>
                     <c ca="center">
                        <p>11.4</p>
                     </c>
                     <c ca="center">
                        <p>0.9</p>
                     </c>
                     <c ca="center">
                        <p>6.2</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>At5</p>
                     </c>
                     <c ca="center">
                        <p>123</p>
                     </c>
                     <c ca="center">
                        <p>84</p>
                     </c>
                     <c ca="center">
                        <p>13.5</p>
                     </c>
                     <c ca="center">
                        <p>17.3</p>
                     </c>
                     <c ca="center">
                        <p>2.3</p>
                     </c>
                     <c ca="center">
                        <p>7.4</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="7">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total</p>
                     </c>
                     <c ca="center">
                        <p>589</p>
                     </c>
                     <c ca="center">
                        <p>410</p>
                     </c>
                     <c ca="center">
                        <p>65.8</p>
                     </c>
                     <c ca="center">
                        <p>75.3</p>
                     </c>
                     <c ca="center">
                        <p>6.4</p>
                     </c>
                     <c ca="center">
                        <p>37.5</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>Sequence length and coverage were calculated according to Tables S1 and S2 in Additional data file 1.</p>
               </tblfn>
            </tbl>
            <fig id="F1">
               <title>
                  <p>Figure 1</p>
               </title>
               <caption>
                  <p><it>In silico </it>allocation of 410 <it>B. rapa </it>BAC sequence contigs to <it>A. thaliana </it>chromosomes</p>
               </caption>
               <text>
                  <p><it>In silico </it>allocation of 410 <it>B. rapa </it>BAC sequence contigs to <it>A. thaliana </it>chromosomes. BAC sequence contigs (blue bars) were aligned to <it>At </it>chromosomes based on significant and directional matches of sequences using a BLASTZ cutoff of &lt;E<sup>-6</sup>.</p>
               </text>
               <graphic file="gb-2009-10-10-r111-1"/>
            </fig>
            <p>The genome coverage of the gene-rich <it>Br </it>sequences was estimated by representation in two different datasets: expressed sequence tag (EST) sequences and conserved single-copy genes. Based on a BLAT analysis of 32,395 <it>Br </it>unigenes (a set of ESTs that appear to arise from the same transcription locus) against the sequence contigs, the proportion of hits recovered under stringent conditions (see Materials and methods) was 29.2%. This result was largely consistent with the proportion of rosid-conserved single-copy genes showing matches to <it>Br </it>sequences. A TBLASTN comparison of 1,070 <it>At</it>-<it>Medicago truncatula </it>(<it>Mt</it>) conserved single-copy genes against <it>Br </it>sequences revealed a 24.3% match. Both methods indicate approximately 30% coverage of euchromatin in the dataset analyzed; thus, the euchromatic region of <it>Br </it>is estimated to be approximately 220 Mbp, 42% of the whole genome given that the genome size of <it>Br </it>is 529 Mbp <abbrgrp><abbr bid="B30">30</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Characteristics of the <it>B. rapa </it>gene space</p>
            </st>
            <p>Gene annotation was carried out using our specialized <it>Br </it>annotation pipeline. Gene prediction of the <it>Br </it>sequence data using a variety of <it>ab initio</it>, similarity-based, and EST/full-length cDNA-based methods resulted in the construction of 15,762 gene models. Taken together with the genome coverage of <it>Br </it>sequences, the overall number of protein-coding genes in the <it>Br </it>genome is at least 52,000 to 53,000, which is higher than those of other plant genomes sequenced thus far, including <it>At </it><abbrgrp><abbr bid="B7">7</abbr></abbrgrp>, rice (<it>Oryza sativa </it>(<it>Os</it>)) <abbrgrp><abbr bid="B8">8</abbr></abbrgrp>, poplar (<it>Populus trichocarpa </it>(<it>Pt</it>)) <abbrgrp><abbr bid="B9">9</abbr></abbrgrp>, grape <abbrgrp><abbr bid="B10">10</abbr></abbrgrp>, papaya <abbrgrp><abbr bid="B11">11</abbr></abbrgrp>, and sorghum <abbrgrp><abbr bid="B12">12</abbr></abbrgrp>. However, the estimated total number of genes in the <it>Br </it>genome is only twice that of <it>At</it>. Details of the annotation are available online at the URL cited in the 'Data used in this study' section in the Materials and methods.</p>
            <p>The gene structure and density statistics are shown in Table <tblr tid="T2">2</tblr>. The base composition of <it>Br </it>and <it>At </it>genes is very similar. The average length of <it>Br </it>genes (ATG to stop codon) is 73% that of <it>At </it>genes. This is consistent with previous reports on <it>Bo </it><abbrgrp><abbr bid="B19">19</abbr><abbr bid="B20">20</abbr><abbr bid="B26">26</abbr></abbrgrp>. This difference appears to be due to one less exon per gene and shorter exon and intron lengths in <it>Br</it>. The average gene density of 1 per 4.2 kilobase-pairs (kbp) in <it>Br </it>is slightly lower than that in <it>At </it>(1 per 3.8 kbp). Thus, the <it>At</it>/<it>Br </it>ratio of gene density is 0.90, indicating slightly less compact organization of <it>Br </it>euchromatin than <it>At </it>euchromatin. Moreover, the distance between the homologous block endpoints in <it>Br </it>and <it>At </it>has an R<sup>2 </sup>of 0.63 with a <it>dAt</it>/<it>dBr </it>slope of 1.36 (Figure S1 in Additional data file 2). This result indicates that gene-containing regions in <it>At </it>occupy approximately 30 to 40% more space than their <it>Br </it>counterparts. Based on these data and the results mentioned above, we postulate that the euchromatic genome of <it>Br </it>has shrunken by approximately 30% compared to its syntenic <it>At </it>counterpart. Most of the genome shrinkage in <it>Br </it>could be explained by the deletion of roughly one-third of the redundant proteome as well as TEs in the euchromatic <it>Br </it>genome. Only 14% of the <it>Br </it>genes were tandem duplicates compared with 27% of <it>At </it>genes in a 100-kbp window interval. In addition, only 45 nucleotide binding site-encoding genes were identified in <it>Br</it>, suggesting that the total number of nucleotide binding site-encoding genes in the <it>Br </it>genome is likely to be almost the same as that in <it>At </it>(approximately 200) <abbrgrp><abbr bid="B31">31</abbr><abbr bid="B32">32</abbr></abbrgrp>. A database search revealed that a total of 12,802 (81%) of the predicted <it>Br </it>genes have similarity (&lt;E<sup>-10</sup>) to proteins in the non-redundant nucleotide database of the National Center for Biotechnology Information (NCBI); 2,960 (19%) are <it>Br </it>unique genes. To assess the putative function of the genes that recorded no hits to non-redundant proteins, we assigned functional categories to the <it>Br </it>unique genes using gene ontology analysis; however, this analysis could not identify a putative function for approximately 85% of the <it>Br </it>unique genes. Thus, we can conclude that 16% of the proteome of <it>Br </it>has acquired a novel function since the <it>Br</it>-<it>At </it>divergence.</p>
            <tbl id="T2">
               <title>
                  <p>Table 2</p>
               </title>
               <caption>
                  <p>Comparison of the overall composition of annotated protein coding genes in the <it>B. rapa </it>sequence contigs and euchromatic counterparts in the <it>A. thaliana </it>genome</p>
               </caption>
               <tblbdy cols="3">
                  <r>
                     <c ca="left">
                        <p>
                           <b>Feature</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>
                              <it>B. rapa</it>
                           </b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b><it>A</it>. thaliana*</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c cspan="3">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Number of sequence contigs</p>
                     </c>
                     <c ca="center">
                        <p>410</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total sequence length (Mbp)</p>
                     </c>
                     <c ca="center">
                        <p>65.8</p>
                     </c>
                     <c ca="center">
                        <p>75.3</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Transposons (%)</p>
                     </c>
                     <c ca="center">
                        <p>6</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Number of protein coding genes</p>
                     </c>
                     <c ca="center">
                        <p>15,762</p>
                     </c>
                     <c ca="center">
                        <p>19,639</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>Number of exons per gene</p>
                     </c>
                     <c ca="center">
                        <p>4.7</p>
                     </c>
                     <c ca="center">
                        <p>5.5</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>Intron size (bp)</p>
                     </c>
                     <c ca="center">
                        <p>141</p>
                     </c>
                     <c ca="center">
                        <p>162</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>Exon size (bp)</p>
                     </c>
                     <c ca="center">
                        <p>225</p>
                     </c>
                     <c ca="center">
                        <p>230</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Average gene size (kbp)</p>
                     </c>
                     <c ca="center">
                        <p>1.6</p>
                     </c>
                     <c ca="center">
                        <p>2.2</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Average gene density (kbp/gene)</p>
                     </c>
                     <c ca="center">
                        <p>4.2</p>
                     </c>
                     <c ca="center">
                        <p>3.8</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Overall G/C content (%)</p>
                     </c>
                     <c ca="center">
                        <p>35.2</p>
                     </c>
                     <c ca="center">
                        <p>35.8</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>Exons</p>
                     </c>
                     <c ca="center">
                        <p>46.3</p>
                     </c>
                     <c ca="center">
                        <p>44.6</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>Introns</p>
                     </c>
                     <c ca="center">
                        <p>32.6</p>
                     </c>
                     <c ca="center">
                        <p>32.0</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>Intergenic regions</p>
                     </c>
                     <c ca="center">
                        <p>31.3</p>
                     </c>
                     <c ca="center">
                        <p>31.8</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>*<it>A. thaliana </it>statistics are based on version TAIR7 annotation available on the <it>Arabidopsis </it>Information Resource website <abbrgrp><abbr bid="B74">74</abbr></abbrgrp>.</p>
               </tblfn>
            </tbl>
            <p>Repetitive sequence analysis revealed that 6% of euchromatic <it>Br </it>sequences are composed of TEs, a twofold greater amount than identified in the counterpart <it>At </it>euchromatic genome, presumably due to a greater number of LTRs and long interspersed elements (Table <tblr tid="T3">3</tblr>). In addition, low complexity repetitive sequences are relatively abundant in the <it>Br </it>euchromatic region, indicating <it>Br</it>-specific expansion of repetitive sequences. The distribution of repetitive sequences and TEs along the chromosomes was not uneven (Figure S2 in Additional data file 2). It has previously been reported, based on partial draft genome shotgun sequences, that <it>Bo </it>(approximately 696 Mbp) has a significantly higher proportion of both class I and class II TEs sequences than <it>At </it><abbrgrp><abbr bid="B33">33</abbr></abbrgrp>. Taken together with these previous reports <abbrgrp><abbr bid="B34">34</abbr><abbr bid="B35">35</abbr></abbrgrp>, TEs appear to be partly responsible for genome expansion in the <it>Brassica </it>lineage, and these TEs appear to accumulate predominantly in the heterochromatic regions of <it>Br</it>.</p>
            <tbl id="T3">
               <title>
                  <p>Table 3</p>
               </title>
               <caption>
                  <p>Comparison of repetitive sequences identified in the <it>B. rapa </it>sequence contigs and euchromatic counterparts in the <it>A. thaliana </it>genome</p>
               </caption>
               <tblbdy cols="3">
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c cspan="2" ca="center">
                        <p>
                           <b>Genome coverage (%)*</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c cspan="2">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Family</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>
                              <it>B. rapa</it>
                           </b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>
                              <it>A. thaliana</it>
                           </b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c cspan="3">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>SINEs</p>
                     </c>
                     <c ca="center">
                        <p>0.1</p>
                     </c>
                     <c ca="center">
                        <p>0.0</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>LINEs</p>
                     </c>
                     <c ca="center">
                        <p>1.3</p>
                     </c>
                     <c ca="center">
                        <p>0.3</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>LTRs</p>
                     </c>
                     <c ca="center">
                        <p>2.4</p>
                     </c>
                     <c ca="center">
                        <p>0.8</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>DNA transposons</p>
                     </c>
                     <c ca="center">
                        <p>2.2</p>
                     </c>
                     <c ca="center">
                        <p>1.6</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Satellites</p>
                     </c>
                     <c ca="center">
                        <p>0.4</p>
                     </c>
                     <c ca="center">
                        <p>0.0</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Low complexity repetitive sequences</p>
                     </c>
                     <c ca="center">
                        <p>4.4</p>
                     </c>
                     <c ca="center">
                        <p>1.0</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Other<sup>&#8224;</sup></p>
                     </c>
                     <c ca="center">
                        <p>0.4</p>
                     </c>
                     <c ca="center">
                        <p>0.1</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="3">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total</p>
                     </c>
                     <c ca="center">
                        <p>11.2</p>
                     </c>
                     <c ca="center">
                        <p>3.8</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>*Genome coverage was calculated using 65.8 Mbp for <it>B. rapa </it>and 75.3 Mbp for the euchromatic counterpart of <it>A. thaliana</it>. <sup>&#8224;</sup>This refers to simple sequence repeats and short tandem repeats. LINE, long interspersed element; SINE, short interspersed element.</p>
               </tblfn>
            </tbl>
         </sec>
         <sec>
            <st>
               <p>Synteny between the <it>B. rapa </it>and <it>A. thaliana </it>genomes</p>
            </st>
            <p>To identify syntenic regions in the <it>Br </it>and <it>At </it>genomes, we compared the whole proteome between the two genomes using BLASTP analysis, and putative synteny blocks were plotted using DiagHunter and GenoPix2D programs <abbrgrp><abbr bid="B36">36</abbr></abbrgrp>. The non-redundant chromosome-ordered genome sequence in the <it>Br </it>build was 62.5 Mbp. An additional 3.2 Mbp had not yet been assigned to chromosomes and was therefore not used for synteny analysis. We examined the synteny blocks at three different levels: whole genome (Figure <figr fid="F2">2a</figr>), large-scale synteny blocks in chromosome-to-chromosome windows (Figure <figr fid="F2">2b</figr>; Additional data file 3), and microsynteny &lt;2.5 Mbp (the synteny can be viewed at the URL cited in the 'Data used in this study' section in the Materials and methods). Although the <it>Br </it>genome build was partial and incomplete with only approximately 30% of euchromatin represented and some misordered contigs present, the level of synteny between the genomes was prominent and distinct. The DiagHunter program detected 227 highly homologous syntenic blocks with 72% of the sequenced and anchored <it>Br </it>sequence assigned to synteny blocks in <it>At </it>and 72% of <it>At </it>euchromatic sequence assigned to synteny blocks in <it>Br </it>when multiple blocks overlapping the same region were counted (Figure <figr fid="F2">2a</figr>). Considering the history of frequent genome duplication events in Brassicaceae, this result strongly indicates the presence of secondary or tertiary blocks resulting from WGT.</p>
            <fig id="F2">
               <title>
                  <p>Figure 2</p>
               </title>
               <caption>
                  <p>Synteny between the <it>B. rapa </it>and <it>A. thaliana </it>genomes</p>
               </caption>
               <text>
                  <p>Synteny between the <it>B. rapa </it>and <it>A. thaliana </it>genomes. <b>(a) </b>Percent coverage of individual chromosomes showing synteny between <it>B. rapa </it>and <it>A. thaliana</it>. Coverage was calculated as the gene number of an individual chromosome per sum of genes with BLASTP hits. Note that the overall coverage of an individual chromosome for the counterpart genome can exceed 100% because multiple best BLAST hits over the same region are counted. <b>(b) </b>Chromosome correspondence between <it>B. rapa </it>and <it>A. thaliana </it>represented by a dot-plot. Each dot represents a reciprocal best BLASTP match between gene pairs at an E-value cutoff of &lt;E<sup>-20</sup>. Red dots show regions of synteny with more than 50% gene conservation as identified by DiagHunter. Some <it>Br </it>chromosome orientations have been flipped (A1<sup>f</sup>, A3<sup>f</sup>, A7<sup>f</sup>) to visually correspond to <it>At </it>orientations. Both <it>Br </it>and <it>At </it>have been scaled to occupy the same lengths. Color bars on the upper and left margins of the dot plot indicate individual chromosomes of <it>At </it>and <it>Br</it>, respectively. Black dots on the <it>At </it>chromosomes are centromeres. The color-shaded boxes in the dot plots represent long-range synteny blocks along chromosome pairs. Boxes with the same color are putative triplicated remnants. See Additional data file 3 and the URL cited in Materials and methods for all dot plots and related results, including detailed close-ups of regions of synteny.</p>
               </text>
               <graphic file="gb-2009-10-10-r111-2"/>
            </fig>
            <p>The <it>Br </it>and <it>At </it>genomes share a minimum of 20 large-scale synteny blocks with substantial microsynteny; these synteny blocks extend the length of whole chromosome arms. <it>At </it>shows synteny of chromosome arms with multiple chromosome blocks of <it>Br</it>, apparently corresponding to triplicated remnants (Figure <figr fid="F2">2b</figr>). <it>At</it>1S (short arm), <it>At</it>2L (long arm), <it>At</it>4L, and <it>At</it>5 have three long-range synteny counterparts in three independent <it>Br </it>chromosomes. However, <it>At</it>1L and <it>At</it>3 have only one or two synteny blocks in the <it>Br </it>genome. Moreover, some genome regions of <it>At</it>, including a smaller section of <it>At</it>2S and <it>At</it>4S, show no significant synteny with <it>Br </it>counterparts, indicating chromosome-level deletion of triplicated segments. Incidentally, <it>Br </it>shows synteny with a major single chromosome along almost the entire length (A1, A2, A4, and A10) or fragments of multiple <it>At </it>chromosomes in a complicated mosaic pattern, indicating frequent recombination of <it>Br </it>chromosomes. Notable regions of synteny are shown in Figure <figr fid="F2">2b</figr>, and are At1S-A6/A8/A9, At1L-A7, At2L-A3/A4/A5, At3S-A3/A5, At3L-A7/A9, At4L-A1/A3/A8, and At5-A2/A3/A10 (synteny view available at the URL cited in the 'Data used in this study' section in the Materials and methods. Additional synteny blocks scattered throughout genome regions, probably due to recombination, were also identified.</p>
            <p>Within individual synteny blocks, microsynteny (conservation of gene content and order) was considerable. The average degree of proteome conservation for all predicted synteny blocks was 52 &#177; 13% in the blocks (Table S3 in Additional data file 1). This value is almost the same as that of the <it>Mt</it>-<it>Lotus japonicus </it>comparison in which an ancient WGD event at a similar time period (Ks 0.7 to 0.9) as the <it>Br</it>-<it>At </it>WGD but earlier speciation (Ks 0.6) than <it>Br</it>-<it>At </it>was detected <abbrgrp><abbr bid="B18">18</abbr></abbrgrp>. The underestimated value reported here presumably reflects significant gene loss and rearrangement after WGT in the <it>Br </it>lineage resulting in genome shrinkage, based on the fact that deletion events in syntenic blocks of the <it>Br </it>genome were twofold more frequent than in the <it>At </it>genome. Genes without corresponding homologs in syntenic regions contributed to 15 &#177; 7% of all genes from <it>Br </it>but 33 &#177; 13% from <it>At </it>(Table S3 in Additional data file 1; Additional data file 3). Genes encoding proteins involved in transcription or signal transduction were not found to be significantly more retained in syntenic blocks than those encoding proteins classified as having other functions. Further genome sequencing will help resolve the synteny in the uncovered and/or the scattered genome regions.</p>
         </sec>
         <sec>
            <st>
               <p>Rearrangement of the <it>B. rapa </it>genome</p>
            </st>
            <p>Comparison of the genomes of <it>Br </it>and <it>At </it>allows insight into the origin and evolution of the <it>Brassica </it>'A' genome. Previous comparative mapping studies have identified a putative ancestral karyotype (<it>AK</it>) comprising 24 building blocks on 8 chromosomes from which the current <it>Arabidopsis </it>and <it>Brassica </it>genomes have evolved via fusion/fission, rearrangement, and deletion of chromosomes followed by polyploidy <abbrgrp><abbr bid="B23">23</abbr><abbr bid="B37">37</abbr><abbr bid="B38">38</abbr><abbr bid="B39">39</abbr></abbrgrp>. According to the <it>At</it>-<it>AK </it>relationship and pair information of <it>Br</it>-<it>At </it>synteny blocks, we defined conserved genome building blocks of <it>AK </it>on the <it>Br </it>genome build (Figure <figr fid="F3">3</figr>; Additional data file 4). The pattern of block boundaries on <it>Br </it>chromosomes was similar to that reported pattern for <it>Bna </it>'A' genome components, albeit more complicated (Figure S3 in Additional data file 2). Most of the block boundaries were conserved between <it>Br </it>and the 'A' genome components of <it>Bna </it>with the exception of several insertions/deletions; this is presumably due to limited sequence and marker information. In addition, inversion or serial mismatched block boundaries were found on A2, A7 and A9, respectively, suggesting recombination of homologous counterpart regions between the 'A' and 'C' genomes in <it>Bna</it>.</p>
            <fig id="F3">
               <title>
                  <p>Figure 3</p>
               </title>
               <caption>
                  <p>Comparison of the genome structures of <it>B. rapa </it>and <it>A. thaliana </it>based on 24 ancestral karyotype genome building blocks</p>
               </caption>
               <text>
                  <p>Comparison of the genome structures of <it>B. rapa </it>and <it>A. thaliana </it>based on 24 ancestral karyotype genome building blocks. The genome structure of <it>At </it>was based on the reports of Schranz <it>et al</it>. <abbrgrp><abbr bid="B37">37</abbr></abbrgrp> and Lysak <it>et al</it>. <abbrgrp><abbr bid="B38">38</abbr></abbrgrp>. The position of genome blocks in the <it>Br </it>chromosome was defined by a comparison of <it>Br</it>-<it>At </it>syntenic relationships and the <it>At</it>-<it>AK </it>mapping results. <it>Br </it>sequences were connected to form continuous sequences. Block boundaries, orientation, and gaps between syntenic blocks are shown in Additional data file 4. Each color corresponds to a syntenic region between genomes. The <it>Br </it>genome is triplicated and more thoroughly rearranged than the <it>At </it>genome.</p>
               </text>
               <graphic file="gb-2009-10-10-r111-3"/>
            </fig>
            <p>An examination of the <it>Br </it>genome from the perspective of ancestral blocks reveals that three copies of the genome are present, as predicted from the WGT (Figure <figr fid="F3">3</figr>). Although there are several discontinuous matches due to gaps between syntenic blocks, almost 50% of the ancestral blocks were triplicated in the <it>Br </it>genome, while others occurred only once or twice, indicating loss of blocks during genome rearrangement. Blocks D, G, and M could not be found on the <it>Br </it>genome. The <it>Br </it>genome is highly rearranged relative to <it>At </it>compared with <it>AK</it>. Block R was localized together with block W in triplicate regions (A2, A3, and A10). However, in At5, blocks R and W were separated on the short arm and long arm, respectively <abbrgrp><abbr bid="B38">38</abbr><abbr bid="B39">39</abbr></abbrgrp>. Similarly, blocks E and N were adjacent and triplicated in <it>Br </it>but separated in <it>At</it>. Meanwhile, blocks K and L, which are fused in <it>AK </it>but split in different chromosomes of <it>At</it>, were adjacent (A6) or separated (A9) on the same chromosomes of <it>Br</it>. However, we did not determine precisely which copy of the replicated <it>AK </it>block family corresponds to the <it>Br </it>BACs because of the possibility that <it>Br </it>sequences in the polyploid genome were not accurately positioned. Because several genetic markers originate from duplicate or triplicate regions of the <it>Br </it>genome, the true location of the BACs could correspond to any of the amplified bands, which could result in inaccurate mapping of the BAC sequence. In this case, the resulting assignment of the BAC to an incorrect linkage group on a specific <it>AK </it>block family member would also be flawed; however, we found that almost all BAC sequences showed excellent correspondence to the correct family of <it>AK </it>blocks. Further analysis, including chromosome painting and additional genome sequencing, will allow determination of the precise location of <it>AK </it>blocks in the <it>Br </it>genome.</p>
         </sec>
         <sec>
            <st>
               <p>Loss of genes from the recent duplication event in the <it>B. rapa </it>genome</p>
            </st>
            <p>To deduce the approximate time point of polyploidy and speciation, we compared the distribution of synonymous substitution (Ks) in homologous sequences identified by a reciprocal best BLAST hit search between <it>Br </it>and the completely annotated sequences of <it>At</it>, <it>Pt</it>, <it>Mt</it>, and <it>Os</it>. As shown in Figure <figr fid="F4">4a-c</figr>, <it>Br </it>shares a single ancient duplication event (1R) with <it>Os</it>, <it>Pt</it>, and <it>Mt </it>as illustrated by single peaks at Ks modes of 2.5 to 2.6, 2.2 to 2.3, and 1.8 to 1.9, respectively, indicating successive splitting of the <it>Br </it>lineage from monocots and eurosid I during the early and late Cretaceous period around 60 to 120 MYA, depending on the neutral substitution rate used <abbrgrp><abbr bid="B40">40</abbr></abbrgrp>. The age distributions of <it>At </it>and <it>Br </it>yield clear peaks corresponding to 2R at Ks = 1.7 to 1.8 and 1.8 to 1.9, respectively, lower than that of the <it>Br</it>-<it>Pt </it>comparison but similar to that of the <it>Br</it>-<it>Mt </it>comparison (Figure <figr fid="F4">4e, f</figr>). This suggests that an ancient burst of gene duplications due to the 2R event in <it>At </it>and <it>Br </it>must have occurred almost immediately after divergence between eurosid I and eurosid II. Taken together with recent studies of the <it>Pt </it><abbrgrp><abbr bid="B9">9</abbr></abbrgrp> and <it>Mt </it>genomes <abbrgrp><abbr bid="B18">18</abbr></abbrgrp>, we conclude that genome duplication in rosids occurred independently after the split from the last common rosid ancestor, and that most polyploidy events (2R, 3R, and 4R) in Brassicaceae postdate the eurosid I (<it>Pt </it>and <it>Mt</it>)-eurosid II (<it>At </it>and <it>Br</it>) divergence.</p>
            <fig id="F4">
               <title>
                  <p>Figure 4</p>
               </title>
               <caption>
                  <p>Traces of polyploidy events in plant genomes</p>
               </caption>
               <text>
                  <p>Traces of polyploidy events in plant genomes. <b>(a-f) </b>The distribution of Ks values obtained from comparisons of sets of putative orthologous genome sequences between <it>Br </it>and the selected model plant species <it>Os </it>(a), <it>Pt </it>(b), <it>Mt </it>(c), and <it>At </it>(d), and from paralogous sequences in <it>At </it>(e) and <it>Br </it>(f) genomes. The vertical axes indicate the frequency of paired sequences, while the horizontal axes denote Ks values with an interval of 0.1. The black bars depict the positions of the modes of Ks distributions obtained from orthologous or paralogous gene pairs. <it>At</it>, <it>A. thaliana</it>; <it>Br</it>, <it>B. rapa</it>; <it>Mt</it>, <it>Medicago truncatula</it>; <it>Os</it>, <it>O. sativa</it>; <it>Pt</it>, <it>Populus trichocarpa</it>.</p>
               </text>
               <graphic file="gb-2009-10-10-r111-4"/>
            </fig>
            <p>The Ks distribution for <it>At </it>and <it>Br </it>orthologs displayed two peaks at Ks = 0.3 to 0.4 and 2.0 to 2.1, corresponding to shared duplication events (3R and 2R) and speciation between the genomes at around 13 to 17 MYA (Figure <figr fid="F4">4d</figr>). As reported before, the oldest duplication (1R) could not be seen in the Ks distributions in both genomes. Surprisingly, a comparison of the Ks mode for the paralogs in <it>At </it>and <it>Br </it>identified remarkable differences in the duplicated genes retained in the two genomes. Furthermore, the <it>At </it>genome has two clear peaks for 3R (mode Ks = 0.6 to 0.7) and 2R (mode Ks = 1.7 to 1.8). However, in the <it>Br </it>genome, two peaks representing 4R (mode Ks = 0.2 to 0.3) and 2R (mode Ks = 1.8 to 1.9) are evident, but the 3R peak has collapsed (Figure <figr fid="F4">4e, f</figr>). The difference between the distributions for <it>Br</it>-<it>Br </it>versus <it>Br</it>-<it>At </it>(<it>P </it>= 1.65E<sup>-8</sup>) was significantly higher than that for <it>At</it>-<it>At </it>versus <it>Br</it>-<it>At </it>(<it>P </it>= 0.001). Taken together, these findings suggest that duplicated genes produced by the 3R event were widely lost in the triplicated <it>Br </it>genome.</p>
            <p>Because we used approximately 30% of the euchromatic sequence of <it>Br</it>, we could have underestimated the 3R event due to biased sampling. To test this possibility, we analyzed the Ks distribution using ESTs. The age distribution of <it>Br </it>based on approximately 120,000 ESTs showed a pattern essentially identical to that obtained using the genome sequence data, illustrating loss of the 3R peak (Figure <figr fid="F5">5a</figr>). The additional peak for Ks = 0.10 to 0.15 may represent a very recent segmental duplication event. Loss of the 3R event appears to be specific to <it>Br </it>amongst <it>Brassica </it>genomes (Figure <figr fid="F5">5b-f</figr>); a <it>Bo</it>-<it>Bo </it>comparison yielded a Ks distribution different to that of <it>Br</it>-<it>Br</it>, with a clear peak corresponding to 3R (mode Ks = 0.85 to 0.90). A similar pattern was observed in the <it>Bna</it>-<it>Bna </it>comparison with underestimation of the peaks for 3R. However, note that the Ks modes for ortholog comparison between <it>Br </it>and <it>Bo</it>, <it>Bo </it>and <it>Bna</it>, and <it>Br </it>and <it>Bna </it>showed very similar Ks distribution with the two peaks for 4R and 2R at similar Ks modes as those in <it>Br</it>-<it>Br </it>paralog analyses, but loss of a peak for 3R. In particular, when the interval of Ks for the <it>Br</it>-<it>Bo </it>comparison was magnified, one additional peak, lying slightly below that for 4R at Ks = 0.34 to 0.36, was identified at Ks = 0.22 to 0.24; this indicates the genome split at around 8 MYA (Figure <figr fid="F5">5g</figr>).</p>
            <fig id="F5">
               <title>
                  <p>Figure 5</p>
               </title>
               <caption>
                  <p>Traces of polyploidy events in the <it>Brassica </it>'A' and 'C' genomes</p>
               </caption>
               <text>
                  <p>Traces of polyploidy events in the <it>Brassica </it>'A' and 'C' genomes. <b>(a-g) </b>Distributions of Ks values were obtained from comparisons of sets of paralogous EST sequences in <it>Br </it>(a), <it>Bo </it>(b), and <it>Bna </it>(c) and comparisons of putative orthologous EST sequences between the genomes (d-g). The vertical axes indicate the frequency of paired sequences, and the horizontal axes denote Ks values at 0.05 (a-f) or 0.02 (g) intervals. The black bars indicate the positions of the modes of Ks distributions obtained from comparisons of orthologous or paralogous gene pairs. <it>Bna</it>, <it>B</it>. <it>napus</it>; <it>Bo</it>, <it>B. oleracea</it>; <it>Br</it>, <it>B. rapa</it>.</p>
               </text>
               <graphic file="gb-2009-10-10-r111-5"/>
            </fig>
            <p>Detection of a peak reflecting 3R in the <it>Bo </it>and <it>Bna </it>genomes but absence of this peak in the <it>Br </it>genome and between the other <it>Brassica </it>genomes strongly supports the hypothesis that duplicated genes from the 3R event were lost in the <it>Br </it>genome due to gradual deletion or suppression, presumably due to functional redundancy in the polyploid genome. To further explore this hypothesis, we compared the degree of conservation of duplicated genes in the sister blocks resulting from 3R and 4R. We found that 33 and 18 sister block pairs were selected for in the 3R and 4R events in the <it>Br </it>genome, respectively (Table S4 in Additional data file 1). The degree of conservation of duplicated genes for 4R was 44%, almost the same as that of the triplicated <it>FLC </it>region <abbrgrp><abbr bid="B20">20</abbr></abbrgrp>, but only 20% for 3R, a value approximately twofold lower than that of <it>Bo </it>based on calculations from published data <abbrgrp><abbr bid="B19">19</abbr></abbrgrp>. This suggests greater deletion of duplicated genes in <it>Br </it>than <it>Bo </it>(Table <tblr tid="T4">4</tblr>; Tables S4 and S5 in Additional data file 1).</p>
            <tbl id="T4">
               <title>
                  <p>Table 4</p>
               </title>
               <caption>
                  <p>Comparison of the degree of conservation between duplicated groups originating from different polyploidy events in <it>B. rapa </it>and <it>B. oleracea</it></p>
               </caption>
               <tblbdy cols="6">
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Number of groups produced</b>
                        </p>
                     </c>
                     <c cspan="3" ca="center">
                        <p>
                           <b>Number of genes*</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Degree of conservation</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c cspan="3">
                        <hr/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Duplication event</b>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Total</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Unpaired</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Conserved</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>(%)<sup>&#8224;</sup></b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c cspan="6">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <it>B. rapa</it>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>3R event</p>
                     </c>
                     <c ca="center">
                        <p>33</p>
                     </c>
                     <c ca="center">
                        <p>2,017</p>
                     </c>
                     <c ca="center">
                        <p>1,623</p>
                     </c>
                     <c ca="center">
                        <p>394</p>
                     </c>
                     <c ca="center">
                        <p>19.5</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>4R event</p>
                     </c>
                     <c ca="center">
                        <p>18 (3)</p>
                     </c>
                     <c ca="center">
                        <p>651 (112)</p>
                     </c>
                     <c ca="center">
                        <p>367 (58)</p>
                     </c>
                     <c ca="center">
                        <p>284 (54)</p>
                     </c>
                     <c ca="center">
                        <p>43.6 (48.2)</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>Segmental duplication</p>
                     </c>
                     <c ca="center">
                        <p>1 (1)</p>
                     </c>
                     <c ca="center">
                        <p>24 (28)</p>
                     </c>
                     <c ca="center">
                        <p>4 (0)</p>
                     </c>
                     <c ca="center">
                        <p>20 (28)</p>
                     </c>
                     <c ca="center">
                        <p>83.3 (100)</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <it>B. oleracea</it>
                           <sup>&#8225;</sup>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>3R event</p>
                     </c>
                     <c ca="center">
                        <p>9</p>
                     </c>
                     <c ca="center">
                        <p>310</p>
                     </c>
                     <c ca="center">
                        <p>196</p>
                     </c>
                     <c ca="center">
                        <p>114</p>
                     </c>
                     <c ca="center">
                        <p>36.8</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>4R event</p>
                     </c>
                     <c ca="center">
                        <p>6</p>
                     </c>
                     <c ca="center">
                        <p>217</p>
                     </c>
                     <c ca="center">
                        <p>81</p>
                     </c>
                     <c ca="center">
                        <p>136</p>
                     </c>
                     <c ca="center">
                        <p>62.7</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>Data in parentheses are those from the <it>Flowering Locus C </it>(<it>FLC</it>) regions <abbrgrp><abbr bid="B20">20</abbr></abbrgrp>. *Tandem duplicated genes were considered to be a single homolog. <sup>&#8224;</sup>The degree of conservation was calculated by dividing the number of conserved genes by the total number of genes. <sup>&#8225;</sup>Information about the <it>Bo </it>genome was obtained from the report of Town <it>et al</it>. <abbrgrp><abbr bid="B19">19</abbr></abbrgrp>.</p>
               </tblfn>
            </tbl>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Discussion</p>
         </st>
         <sec>
            <st>
               <p>A comparative genomics approach to target the euchromatic gene space of a crop genome</p>
            </st>
            <p>Investigation of crop genomes not only offers information that can be used for agricultural improvement, but also provides opportunities to understand angiosperm biology and evolution. As of 2009, the genome sequences of only five economically important crop plants (rice, poplar, grape, papaya, and sorghum) have been published <abbrgrp><abbr bid="B8">8</abbr><abbr bid="B9">9</abbr><abbr bid="B10">10</abbr><abbr bid="B11">11</abbr><abbr bid="B12">12</abbr></abbrgrp>, and whole genome sequencing projects are currently underway for only a few selected crop species. One hurdle faced when sequencing a crop genome is genome obesity due to polyploidy and repetitive DNA <abbrgrp><abbr bid="B41">41</abbr></abbrgrp>. Therefore, a stepwise approach is required to obtain genome-wide information from crop genomes, and strategies for targeting gene-rich fractions are required. In combination with EST sequencing, two approaches - methylation filtration <abbrgrp><abbr bid="B42">42</abbr></abbrgrp> and Cot-based cloning and sequencing <abbrgrp><abbr bid="B43">43</abbr></abbrgrp> - were developed to capture euchromatic regions. Although both methods enrich for gene-rich fractions, they can exclude transcriptionally suppressed regions or euchromatic regions with abundant interspersed repetitive sequences (tandem repeats). We applied a novel gene space targeting method by allocating BAC clones to a closely related model genome based on BAC end sequence (BES) matches; this approach has not previously been reported in a genome sequencing project. This method has several advantages. First, gene-rich fractions of the crop genome can be obtained successfully <it>in silico </it>without additional experiments. We collected approximately 30% of the euchromatic region of <it>B. rapa </it>in this study. If a greater overlap between the clones and target region is allowed, and additional information in the form of genetic maps and physical contigs is used, the gene-rich fraction recovered is likely to increase significantly. Second, clone-by-clone strategies used in genome sequencing can benefit directly from this method because of selection of gene-rich seed BACs as well as the alignment of sequence scaffolds. Quick selection of a sufficient number of gene-rich seed BACs and directed ordering of the sequence scaffold will likely accelerate clone-based whole genome sequencing at reduced cost. The BAC clones selected in this study can be used as seed BACs for the ongoing clone-by-clone genome sequencing of <it>Br </it><abbrgrp><abbr bid="B27">27</abbr><abbr bid="B28">28</abbr></abbrgrp>. Third, this analysis allows investigation of syntenic relationships between wild and crop genomes, thereby informing our understanding of crop evolution. Integration of genomes based on sequence level comparisons can offer a platform for the correlation between specific genes and phenotypes, which is important for further improvement of crops. We anticipate that application of our method will accelerate knowledge spreading from nodal model species to closely related taxa. For example, genome sequencing of other <it>Brassica </it>crops, particularly the construction of sequence assemblies and scaffolds of <it>Bna</it>, can benefit from the information obtained from the <it>Br </it>genome; this holds true even for next-generation sequencing. Thus, we anticipate that this study will make a significant contribution to structural and comparative genomic studies of crop species.</p>
         </sec>
         <sec>
            <st>
               <p>Counterbalancing genome obesity after whole genome triplication in <it>B. rapa</it></p>
            </st>
            <p>A large-scale comparison of <it>Br </it>genomic sequences and the whole euchromatic region of <it>At </it>demonstrated extensive synteny between the genomes, and provided clear evidence of a recent WGT event in the <it>Brassica </it>lineage. Our results significantly expand on previous observations of synteny between <it>At </it>and <it>Br </it>based on comparative genetic mapping <abbrgrp><abbr bid="B23">23</abbr></abbrgrp> and small-scale comparisons of homologous regions <abbrgrp><abbr bid="B20">20</abbr></abbrgrp> by deciphering the start-end points of macrosynteny blocks and elucidating the fine-scale details of microsynteny within the syntenic regions more accurately. Even though the <it>Br </it>sequencing project is still underway and the sequences used in this study are incomplete, the scale of synteny between the two genomes at both the macro- and micro-levels is significant. As the <it>Br </it>sequencing project moves forward, the availability of nearly complete coverage of the euchromatin will enable more precise definition of syntenic blocks between <it>At </it>and <it>Br</it>, which can be used to reconstruct ancestral chromosome sequences of <it>Brassica</it>.</p>
            <p>Despite the WGT event, the total number of genes in the <it>Br </it>genome was estimated to be approximately 53,000, which is only a twofold increase compared with that of <it>At</it>. The usual fate of a duplicate-gene pair in a polyploid genome is nonfunctionalization or the deletion of one copy <abbrgrp><abbr bid="B44">44</abbr><abbr bid="B45">45</abbr><abbr bid="B46">46</abbr></abbrgrp>. The reduction in the overall number of genes in the triplicated <it>Br </it>genome can be regarded as a result of a process that restores the diploid state, thereby counterbalancing genome obesity. This process seemed to be driven by the deletion of redundant genome components at the level of both the chromosome and the gene. A genome-wide synteny comparison between <it>Br </it>and <it>At </it>revealed that some of the triplicated copies of <it>Br </it>segments were lost or reconstructed. In addition, microsynteny analysis also indicated a relatively shrunken genome throughout the entire euchromatic region of the <it>Br </it>genome, with the <it>Br </it>gene space occupying a fraction 30% smaller than that of <it>At </it>due to a higher frequency of deletion events in the <it>Br </it>genome. A previous study reported that in the <it>At </it>genome, genes with regulatory functions, such as those encoding transcription factors or genes involved in signal transduction, were retained significantly more often than genes with other molecular functions <abbrgrp><abbr bid="B5">5</abbr></abbrgrp>. However, we did not find differential retention of genes according to molecular function, which suggests random deletion of redundant genes in triplicated regions of the <it>Br </it>genome before functional diversification.</p>
            <p>Several mechanisms responsible for post-polyploid changes have been proposed. These include chromosome rearrangements caused by unequal crossing-over, homologous recombination, translocation, or other cytogenetic events <abbrgrp><abbr bid="B47">47</abbr><abbr bid="B48">48</abbr><abbr bid="B49">49</abbr><abbr bid="B50">50</abbr></abbrgrp>. A tandem array with high sequence similarity would be a good candidate for deletion, because it is more likely to recombine and less likely to have a severe phenotype when one redundant gene is deleted. Fewer tandem duplicate genes in the <it>Br </it>genome may, therefore, be attributable to an increase in the rate of deletion. Incidentally, because polyploidy itself is a form of genomic 'disturbance,' it might induce a cellular response such as epigenetic silencing by hypermethylation, which may be especially relevant to genome evolution <abbrgrp><abbr bid="B48">48</abbr></abbrgrp>. As a result, the epigenetic response itself may accelerate the rate of mutation, thereby causing rapid genomic change as seen in <it>Br</it>. In addition, polyploidy could increase transposable element activity, causing the deletion of genes or even chromosome segments. Illegitimate recombination of TEs has been demonstrated to have the ability to remove large blocks of DNA in <it>Arabidopsis</it>, rice, <abbrgrp><abbr bid="B15">15</abbr><abbr bid="B49">49</abbr></abbrgrp> and wheat <abbrgrp><abbr bid="B51">51</abbr></abbrgrp>. We speculate that the twofold increase in transposon accumulation in the triplicated euchromatic regions of <it>Br </it>compared to the euchromatic counterpart regions of <it>At </it>might be correlated with the deletion of duplicated genes.</p>
         </sec>
         <sec>
            <st>
               <p>Evolution of the <it>Brassica </it>'A' genome</p>
            </st>
            <p>Multiple rounds of polyploidy are thought to have occurred during angiosperm evolution, although the number and timing of polyploidy events vary between plant groups <abbrgrp><abbr bid="B5">5</abbr><abbr bid="B52">52</abbr></abbrgrp>. Thus, most modern plant genomes harbor evidence of multiple rounds of past polyploidization. The genome evolution of Brassicaceae has been inferred mainly from studying <it>Arabidopsis</it>. There is evidence from several studies for one round of genome duplication after the eudicot divergence and additional rounds of polyploidization following the divergence of <it>Arabidopsis </it>from its common ancestor with cotton <abbrgrp><abbr bid="B5">5</abbr></abbrgrp>. In this study, we refined inferences of the number and timing of polyploidy events, and we now discuss the impact of these events on the structure and evolution of the <it>Brassica </it>'A' genome (Figure <figr fid="F6">6</figr>). Ks estimates suggest that the <it>Brassica </it>genome shared two genome duplication events (2R and 3R) with <it>Arabidopsis </it>postdating the eurosid I (<it>Pt </it>and <it>Mt</it>) and eurosid II (<it>At </it>and <it>Br</it>) divergence. The third polyploidy event (4R) was a <it>Brassica </it>lineage-specific whole genome triplication after the split of <it>Brassica </it>from the common ancestor of <it>Brassica </it>and <it>Arabidopsis</it>. The 227 synteny blocks identified between <it>Br </it>and <it>At </it>can serve as a basis for reconstruction of the ancestral genome and chromosomes of the <it>Br</it>-<it>At </it>ancestor, although a more complete genome sequence and additional evidence are still required. The mapping of ancestral chromosome building blocks to the <it>Br </it>genome strongly suggests that the <it>Br </it>genome evolved from a pre-triplicated ancestor with a unique organization of the retracted <it>AK</it>, which was different from that of <it>At</it>, by chromosomal rearrangement shortly after 3R but prior to 4R. This event might have resulted in the divergence of the <it>Arabidopsis </it>and <it>Brassica </it>lineages.</p>
            <fig id="F6">
               <title>
                  <p>Figure 6</p>
               </title>
               <caption>
                  <p>Polyploidy events in the evolution of the <it>Brassica </it>genome</p>
               </caption>
               <text>
                  <p>Polyploidy events in the evolution of the <it>Brassica </it>genome. Each star indicates a WGD (1R, 2R, and 3R) or WDT (4R) event on the branch. Estimation of dates for polyploidy and speciation events are given in million years and are based on the Ks analysis performed in this study, except for the 1R event, which was inferred from a previous report <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>. A geographic time-table is provided on the right border of the figure. <it>At</it>, <it>A. thaliana</it>; <it>Bna</it>, <it>B</it>. <it>napus</it>; <it>Bo</it>, <it>B. oleracea</it>; <it>Br</it>, <it>B. rapa</it>; <it>Mt</it>, <it>Medicago truncatula</it>; <it>Os</it>, <it>O. sativa</it>; <it>Pt</it>, <it>Populus trichocarpa</it>.</p>
               </text>
               <graphic file="gb-2009-10-10-r111-6"/>
            </fig>
            <p>More importantly, differential gene loss following 4R in the <it>Brassica </it>genome might be responsible for the diversification of the genome, based on the finding that significantly more genes duplicated as a result of 3R have been lost in <it>Br </it>than in <it>Bo</it>. However, it is not clear if duplicated genes from the 3R event that were retained in <it>Bo </it>have diverged functionally. It appears that the split between <it>Br </it>and <it>Bo </it>happened rapidly (0.1 Ks interval) compared to the <it>At</it>-<it>Brassica </it>split (0.3 Ks interval), perhaps due to differential retention of duplicated genes and genome recombination in the ancestral <it>Brassica </it>genome. These observations, along with the independent accumulation of repetitive sequences, may have facilitated speciation within the tribe <it>Brassiceae</it>, which contains approximately 240 highly diverse species. Further analysis and cross-comparisons of diploid and allopolyploid genomes of <it>Brassica </it>will enhance our understanding of the fate of duplicated genes in the <it>Brassica </it>genome. It appears that, as a counterbalance to genome obesity, there was higher selection pressure on redundant genes in the triplicated <it>Brassica </it>ancestor, accelerating gene loss in this triplicated ancestor compared to the <it>Arabidopsis</it>-<it>Brassica </it>common ancestor. Alternatively, differences in the life cycles of <it>Brassica </it>progenitors might have resulted in the differential deletion of duplicated genes in <it>Brassica </it>genomes. Moreover, artificial selection after domestication could also have had an impact on differentiation of diploid <it>Brassica </it>genomes. Taken together, the available evidence suggests that genome duplication and chromosomal diploidization are ongoing processes collectively driving the evolution of <it>Brassica </it>genomes.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Conclusions</p>
         </st>
         <p>Comparisons of large-scale genomic sequences of <it>Br </it>and the whole euchromatic region of <it>At </it>revealed extensive synteny between the genomes due to at least two shared genome duplication events and a recent WGT event specific to the <it>Brassica </it>lineage. The reduction of the number of genes in the triplicated <it>Br </it>genome by approximately one-third can be regarded to be the result of a process counterbalancing genome obesity to regain the diploid state. Segmental loss of triplicated genome blocks and differential deletion of duplicated genes in <it>Br </it>along with less accumulation of transposons appear to have resulted in the small size of the <it>Br </it>genome (approximately 529 Mbp) compared to its sibling species, <it>Bo </it>(approximately 696 Mbp) and <it>Bn </it>(approximately 632 Mbp) <abbrgrp><abbr bid="B30">30</abbr></abbrgrp>. The events proposed here indicate that genome diploidization following polyploidy played an important role in the radiation of <it>Brassica</it>. Our results clarify the orthology between <it>Br </it>and <it>At </it>and establish a strong basis for the genome evolution of <it>Brassica</it>. All the sequenced BAC clones investigated in this study were provided to the <it>B. rapa </it>Genome Sequencing Project as seed BACs for use as starting points for chromosome sequencing.</p>
      </sec>
      <sec>
         <st>
            <p>Materials and methods</p>
         </st>
         <sec>
            <st>
               <p>BAC selection, sequencing, and sequence contig assembly</p>
            </st>
            <p>We previously published an efficient and novel clone selection method based on <it>in silico </it>BES matches to a model genome, which we named the comparative tiling method <abbrgrp><abbr bid="B29">29</abbr></abbrgrp>. To select gene-rich <it>Br </it>BAC clones covering the entire <it>At </it>euchromatic regions, a total of 92,000 BESs were allocated to <it>At </it>chromosomes by using BLASTZ at a cutoff of &lt;E<sup>-6 </sup>with both end matches at 30 to 500 kbp intervals. A total of 4,647 BAC clones were allocated to 92 Mbp of <it>At </it>euchromatic regions and 589 minimally overlapping BAC clones (292 overlapping clones with an average of 41 kbp overlaps and 297 singleton clones) were finally selected and sequenced using an ABI 3730xl sequencer. The minimal sequence goal was five phase 2 (fully oriented and ordered sequence with some small gaps and low quality sequences) contigs, but 18 clones (3%) were sequenced as phase 1 due to large repetitive sequences (Table S1 in Additional data file 1). To anchor clones, a combination of sequence-based genetic mapping <abbrgrp><abbr bid="B53">53</abbr></abbrgrp>, fingerprint contig data <abbrgrp><abbr bid="B54">54</abbr></abbrgrp>, and fluorescent <it>in situ </it>hybridization (FISH) was used (Table S2 in Additional data file 1). The sequence contig assembly was created based on overlapping sequences. BAC sequences were assembled into big sequence contigs by first comparing paired BES matches and BAC sequences sharing overlapping positions on the target <it>At </it>chromosomes using Pipmaker <abbrgrp><abbr bid="B55">55</abbr></abbrgrp>. Then, sequence contigs were assembled based on overlapping sequences using Phred/Phrap/Consed programs <abbrgrp><abbr bid="B56">56</abbr><abbr bid="B57">57</abbr><abbr bid="B58">58</abbr></abbrgrp>. The location of sequence contigs or BAC singletons was determined primarily by genetic marker anchors with fingerprint contig information, paired BES, and FISH results providing additional information about local contig and BAC ordering. Pseudochromosome sequences were created by connecting sequence assemblies with 10-kbp additions of anonymous sequences. All the <it>Br </it>sequences used in this study are available at NCBI and the URL cited below in the 'Data used in this study' section and relevant reference sequence sources are listed in Table S6 in Additional data file 1.</p>
         </sec>
         <sec>
            <st>
               <p>Estimation of genome coverage and genome annotation</p>
            </st>
            <p>The sequence coverage of the <it>Br </it>genome by BACs was estimated by calculating the proportions of <it>Br </it>EST unigenes and conserved single-copy rosid genes with strong matches. For EST comparisons, we considered unigenes to have a genome match if more than 90% of unigenes matched with at least 95% identity in a BLAT <abbrgrp><abbr bid="B59">59</abbr></abbrgrp> analysis. For the single-copy rosid gene comparison, we created a list of 1,070 single-copy <it>At </it>and <it>Mt </it>genes not included in the <it>Br </it>EST collections. They were considered to have a genome match in <it>Br </it>if at least 50% of the gene matched in a TBLASTN <abbrgrp><abbr bid="B60">60</abbr></abbrgrp> search at a cutoff of &lt;E<sup>-100</sup>. The assembled sequences were masked using RepeatMasker <abbrgrp><abbr bid="B61">61</abbr></abbrgrp> using a dataset combining the plant repeat element database of the Munich Information Center for Protein Sequence (MIPS) <abbrgrp><abbr bid="B62">62</abbr></abbrgrp> and our specialized database of <it>Br </it>repetitive sequences. Gene model prediction was performed using EVidenceModeler <abbrgrp><abbr bid="B63">63</abbr></abbrgrp>. Putative exons and open reading frames were predicted <it>ab initio </it>using FGENESH <abbrgrp><abbr bid="B64">64</abbr></abbrgrp> and AUGUSTUS <abbrgrp><abbr bid="B65">65</abbr></abbrgrp> programs with the parameters trained using the <it>Br </it>matrix. To predict consensus gene structures, <it>Br </it>ESTs plus full-length cDNAs, plant transcripts, and plant protein sequences were aligned to the predicted genes using PASA <abbrgrp><abbr bid="B66">66</abbr></abbrgrp> and AAT <abbrgrp><abbr bid="B67">67</abbr></abbrgrp> packages. The predicted genes and evidence sequences were then assembled according to the weight of each evidence type using EVidenceModeler. The highest scoring set of connected exons, introns, and noncoding regions was selected as a consensus gene model. Proteins encoded by gene models were searched against the Pfam database <abbrgrp><abbr bid="B68">68</abbr></abbrgrp> and automatically assigned a putative name based on conserved domain hits or similarity with previously identified proteins. Annotated gene models were also searched against a database of plant transposon-encoded proteins <abbrgrp><abbr bid="B69">69</abbr></abbrgrp>. Predicted proteins with a top match to transposon-encoded proteins were excluded from the annotation and gene counts.</p>
         </sec>
         <sec>
            <st>
               <p>Identification of syntenic blocks based on genome comparisons</p>
            </st>
            <p>Syntenic regions of the genomes of <it>Br </it>and <it>At </it>were identified by a proteome comparison based on BLASTP <abbrgrp><abbr bid="B60">60</abbr></abbrgrp> analysis. The entire proteomes of the two genomes were compared, and only the top reciprocal BLASTP matches per chromosome pair were selected (minimum of 50% alignment coverage at a cutoff of &lt;E<sup>-20</sup>). We chose to perform a BLASTP similarity search because it is inherently more sensitive than BLASTN <abbrgrp><abbr bid="B60">60</abbr></abbrgrp>. Moreover, the BLASTP hit matrix contains fewer BLAST hits that are due to repetitive nucleotide sequences. Chromosome scale synteny blocks were inferred by visual inspection of dot-plots using DiagHunter with parameters as described in Cannon <it>et al</it>. <abbrgrp><abbr bid="B36">36</abbr></abbrgrp>. Gene orientation, insertions/deletions, and inversions were considered, and at least four genes with the same respective orientations in both genomes were required to establish a primary candidate synteny block. To distinguish highly homologous real synteny blocks from false positives due to multiple rounds of polyploidy followed by genome rearrangement, we manually checked all the primary candidate blocks. Previous studies reported that the degree of gene conservation between <it>At </it>and the <it>Brassica </it>genome in several selected syntenic regions was >50%. Based on this result, 227 blocks showing a gene conservation index of >50% (twice the number of conserved matches divided by the total number of non-redundant genes in the blocks; tandem duplicated genes were collapsed to a single homolog) were selected as real syntenic regions. For microsynteny analysis, we manually broke the blocks if <it>At </it>homologs of independent <it>Br </it>sequences in the syntenic blocks were separated by more than 10 kbp. The synteny display is available online at the URL cited in the 'Data used in this study' section.</p>
         </sec>
         <sec>
            <st>
               <p>Ks analysis of homologous sequences</p>
            </st>
            <p>The timing of duplication events and the divergence of homologous segments was estimated by calculating the number of synonymous substitutions per synonymous site (Ks) between homologous genes. For the model genome comparisons, annotated gene models were used, whereas for the comparison between the <it>Brassica </it>genomes, ESTs were analyzed, even though they are error-prone. One drawback associated with the analysis of paralogs derived from ESTs is that multiple entries for the same gene can be included in the dataset, leading to overestimation of redundant Ks measures <abbrgrp><abbr bid="B5">5</abbr></abbrgrp>. However, it is reasonable to assume that redundant Ks measures are randomly distributed among all the Ks values; thus. the effect of redundancy is likely to have been neutral. Before comparing the Ks distribution for EST paralogs and genome sequences of <it>Br</it>, we carefully checked the patterns of Ks in the EST data; we did not find any significantly overestimated bulges or peaks. To identify orthologs and paralogs, the protein sequences of the gene models or ESTs were aligned using the all-against-all alignment and the resulting alignment was used as a reference to align the nucleotide sequences. After removing gaps, the Ks values from pairwise alignments of homologous sequences were determined using the maximum likelihood method implemented in the CODEML <abbrgrp><abbr bid="B70">70</abbr></abbrgrp> program of the PAML <abbrgrp><abbr bid="B71">71</abbr></abbrgrp> package under the F3&#215;4 model, similar to the analysis described by Blanc <it>et al</it>. <abbrgrp><abbr bid="B25">25</abbr></abbrgrp>. We compared the mode rather than the mean of Ks distributions, because the mode is not affected by bias due to incorrectly defined homolog pairs, which is partly responsible for unexpected overestimation of Ks. Only gene pairs with a Ks estimate of &lt;5 were considered for further evaluation and their Ks age distribution was calculated using the interval 0.02 to 0.1. Divergence time calculations were based on the neutral substitution rate of 1.5 &#215; 10<sup>-8 </sup>substitutions per site per year for chalcone synthase (<it>Chs</it>) and alcohol dehydrogenase (<it>Adh</it>) <abbrgrp><abbr bid="B40">40</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Gene conservation between sister blocks in the <it>B. rapa </it>genome</p>
            </st>
            <p>Because <it>Br </it>BAC clones were selected to minimally overlap the target <it>At </it>region, self comparison of <it>Br </it>sequences using the DiagHunter program found few duplicated regions (Figure S4 in Additional data file 2). Instead, we manually identified sister blocks of duplication events by using synteny group information between <it>Br </it>and <it>At</it>. <it>Br </it>sequence blocks were defined as putative sister blocks of 3R if two different sequence blocks showed high synteny with respect to <it>At </it>regions known to be duplicated remnants of 3R <abbrgrp><abbr bid="B72">72</abbr></abbrgrp>, whereas independent <it>Br </it>sequence blocks sharing the same syntenic relationship with a single <it>At </it>region were selected as sister blocks of 4R. For additional validation, we compared the Ks distribution modes between the paralog gene pairs in the sister blocks.</p>
         </sec>
         <sec>
            <st>
               <p>Data used in this study</p>
            </st>
            <p>All the data used in this study can be accessed online at <abbrgrp><abbr bid="B73">73</abbr></abbrgrp>.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Abbreviations</p>
         </st>
         <p><it>AK</it>: ancestral karyotype; <it>At</it>: <it>Arabidopsis thaliana</it>; BAC: bacterial artificial chromosome; <it>Bc</it>: <it>Brassica carinata</it>; BES: BAC end sequence; <it>Bj</it>: <it>Brassica juncea</it>; <it>Bn</it>: <it>Brassica nigra</it>; <it>Bna</it>: <it>Brassica napus</it>; <it>Bo</it>: <it>Brassica oleracea</it>; <it>Br</it>: <it>Brassica rapa</it>; EST: expressed sequence tag; FISH: fluorescent <it>in situ </it>hybridization; kbp, kilobase-pairs; Ks: substitutions per synonymous site; LTR: long terminal repeat retrotransposon; Mbp: megabase-pair; <it>Mt</it>: <it>Medicago truncatula</it>; MYA: million years ago; NCBI: National Center for Biotechnology Information; <it>Os</it>: <it>Oryza sativa</it>; <it>Pt</it>: <it>Populus trichocarpa</it>; TE: transposable element; WGD: whole genome duplication; WGT: whole genome triplication.</p>
      </sec>
      <sec>
         <st>
            <p>Authors' contributions</p>
         </st>
         <p>JHM designed research, performed the experiments, analyzed data, and wrote the manuscript. SJK and TJY designed research and contributed analytic tools. SJK, MJ, JAK, MHL, JSK, KBL, and SIL contributed to data acquisition. YJS and SB developed the database and interfaces to display results on the web. SB, BSC, HJY, DSK, NK, and JHH analyzed data. HJY, IB, and YPL participated in manuscript preparation. BSP conceived the project and supervised its execution.</p>
      </sec>
      <sec>
         <st>
            <p>Additional data files</p>
         </st>
         <p>The following additional data are available with the online version of this paper: Tables S1, S2, S3, S4, S5 and S6 (Additional file <supplr sid="S1">1</supplr>); Figures S1, S2, S3 and S4 (Additional file <supplr sid="S2">2</supplr>); a spreadsheets listing synteny blocks between <it>Br </it>and <it>At </it>genomes (Additional file <supplr sid="S3">3</supplr>); spreadsheets describing genome blocks and block boundaries of the ancestral karyotype (<it>AK</it>) mapped on the <it>B. rapa </it>chromosomes based on <it>Br</it>-<it>At </it>synteny and <it>At</it>-<it>AK </it>correspondences (Additional file <supplr sid="S4">4</supplr>).</p>
         <suppl id="S1">
            <title>
               <p>Additional data file 1</p>
            </title>
            <caption>
               <p>Tables S1, S2, S3, S4, S5 and S6</p>
            </caption>
            <text>
               <p>Table S1: summary of <it>B. rapa </it>sequence contigs, constituent BAC associations, and targeting of homologous regions of <it>A. thaliana </it>based on BLASTZ matches. Table S2: location of sequence contigs on the <it>B. rapa </it>chromosomes according to a combination of genetic map position, FISH results, physical map contig, and positional information from <it>A. thaliana </it>counterparts. Table S3: statistics of microsynteny in the synteny blocks identified by a genome comparison of <it>B. rapa </it>and <it>A. thaliana</it>. Table S4: identification of sister blocks produced by the same polyploidy events in the <it>Br </it>genome based on <it>At</it>-<it>At </it>and <it>At</it>-<it>Br </it>relationships. Table S5: identification of sister blocks produced by the same polyploidy events in the <it>Bo </it>genome. Table S6: sources of genomic and transcript sequences used in this study.</p>
            </text>
            <file name="gb-2009-10-10-r111-S1.PDF">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S2">
            <title>
               <p>Additional data file 2</p>
            </title>
            <caption>
               <p>Figures S1, S2, S3 and S4</p>
            </caption>
            <text>
               <p>Figure S1: comparison of homologous block end-point distances between 410 <it>B. rapa </it>sequence contigs and their <it>Arabidopsis </it>counterpart regions, indicating a genome shrinkage of approximately 30% in <it>B. rapa</it>. Figure S2: abundance of different transposable element types in the <it>B. rapa </it>genome. Figure S3: comparison of <it>Brassica </it>'A' genome structures between <it>B. rapa </it>and <it>B. napus</it>. Genome blocks were defined based on 24 <it>AK </it>genome building blocks. The genome structure of <it>Bna </it>was obtained from the reports of Parkin <it>et al</it>. <abbrgrp><abbr bid="B23">23</abbr></abbrgrp> and Schranz <it>et al</it>. <abbrgrp><abbr bid="B37">37</abbr></abbrgrp>. Regions characterized by significant rearrangements (pink box) or insertions/deletions (gray box) between genomes are highlighted by colored boxes. Scale bars on the margins indicate megabase-pairs (Mbp) for <it>Br </it>or centi-Morgans (cM) for <it>Bna</it>. Blocks with the opposite orientation relative to <it>AK </it>are indicated by a gray upward-pointing arrow on the right side of the block. Figure S4: dot plot of <it>B. rapa </it>compared with itself. Each dot in the dot plot represents a reciprocal best BLASTP match between gene pairs at a cutoff value of &lt;E<sup>-20</sup>. Red dots show the regions of synteny identified by DiagHunter.</p>
            </text>
            <file name="gb-2009-10-10-r111-S2.PDF">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S3">
            <title>
               <p>Additional data file 3</p>
            </title>
            <caption>
               <p>Synteny blocks between <it>Br </it>and <it>At </it>genomes</p>
            </caption>
            <text>
               <p>The data provided include two worksheets. Gene correspondence data for the 227 synteny blocks identified by DiagHunter are provided in the worksheet entitled 'blocks.' The synteny quality of the blocks is included in the worksheet named 'quality'; tandem duplicated genes were considered to be single homologs. The quality of synteny was defined as described in the Materials and methods.</p>
            </text>
            <file name="gb-2009-10-10-r111-S3.ZIP">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S4">
            <title>
               <p>Additional data file 4</p>
            </title>
            <caption>
               <p>Genome blocks and block boundaries of the ancestral karyotype (<it>AK</it>) mapped on the <it>B. rapa </it>chromosomes based on <it>Br</it>-<it>At </it>synteny and <it>At</it>-<it>AK </it>correspondences</p>
            </caption>
            <text>
               <p>This dataset indicates the block order, orientation, and color-coding used for each <it>AK </it>block. The synteny-defined block boundaries on the <it>Br </it>chromosomes identified by DiagHunter were defined according to the <it>At </it>locus name described by Schranz <it>et al</it>. <abbrgrp><abbr bid="B37">37</abbr></abbrgrp>. Supporting data, including gene correspondences in all synteny blocks, are included in the worksheet 'At-Br matches in synteny blocks'. Mapping of <it>AK </it>blocks to the <it>Br </it>chromosomes, including block boundaries and orientation, is provided in the worksheet '<it>AK </it>blocks to <it>Br</it>'. A summary table and graph of <it>AK </it>mapping to the <it>Br </it>chromosomes is provided in the worksheet 'Br chr. chart'.</p>
            </text>
            <file name="gb-2009-10-10-r111-S4.ZIP">
               <p>Click here for file</p>
            </file>
         </suppl>
      </sec>
   </bdy>
   <bm>
      <ack>
         <sec>
            <st>
               <p>Acknowledgements</p>
            </st>
            <p>We thank the many participants in the Korea <it>Brassica rapa </it>Genome Project. Collaborators meriting special note include Hyung Tae Kim of Macrogen for BAC sequencing and Eu-Ki Kim of NIAB, RDA, and the Korean Bioinformation Center, KRIBB, for bioinformatics support. This work was supported by the National Academy of Agricultural Science (05-1-12-2-1, 200901FHT020710397, and 200901FHT020508369) and by the BioGreen 21 Program (20050301034438), Rural Development Administration, Korea.</p>
         </sec>
      </ack>
      <refgrp>
         <bibl id="B1">
            <title>
               <p>Genome duplication and the origin of angiosperm.</p>
            </title>
            <aug>
               <au>
                  <snm>De Bodt</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Maere</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Peer</snm>
                  <mnm>Van de</mnm>
                  <fnm>Y</fnm>
               </au>
            </aug>
            <source>Trends Ecol Evol</source>
            <pubdate>2005</pubdate>
            <volume>20</volume>
            <fpage>591</fpage>
            <lpage>597</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.tree.2005.07.008</pubid>
                  <pubid idtype="pmpid" link="fulltext">16701441</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B2">
            <title>
               <p>In search of the first flower: a Jurassic angiosperm, <it>Archaefructus</it>, from northeast China.</p>
            </title>
            <aug>
               <au>
                  <snm>Sun</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Dilcher</snm>
                  <fnm>DL</fnm>
               </au>
               <au>
                  <snm>Zheng</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Zhou</snm>
                  <fnm>Z</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>1998</pubdate>
            <volume>282</volume>
            <fpage>1692</fpage>
            <lpage>1695</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.282.5394.1692</pubid>
                  <pubid idtype="pmpid" link="fulltext">9831557</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B3">
            <title>
               <p>Archaefructaceae, a new basal angiosperm family.</p>
            </title>
            <aug>
               <au>
                  <snm>Sun</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Ji</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Dilcher</snm>
                  <fnm>DL</fnm>
               </au>
               <au>
                  <snm>Zheng</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Nixon</snm>
                  <fnm>KC</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>X</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2002</pubdate>
            <volume>296</volume>
            <fpage>899</fpage>
            <lpage>904</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.1069439</pubid>
                  <pubid idtype="pmpid" link="fulltext">11988572</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B4">
            <title>
               <p>Evolution of DNA amounts across land plants (embryophyta).</p>
            </title>
            <aug>
               <au>
                  <snm>Leitch</snm>
                  <fnm>IJ</fnm>
               </au>
               <au>
                  <snm>Soltis</snm>
                  <fnm>DE</fnm>
               </au>
               <au>
                  <snm>Soltis</snm>
                  <fnm>PS</fnm>
               </au>
               <au>
                  <snm>Bennett</snm>
                  <fnm>MD</fnm>
               </au>
            </aug>
            <source>Ann Bot</source>
            <pubdate>2005</pubdate>
            <volume>95</volume>
            <fpage>207</fpage>
            <lpage>217</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/aob/mci014</pubid>
                  <pubid idtype="pmpid">15596468</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B5">
            <title>
               <p>Widespread paleopolyploidy in model plant species inferred from age distributions of duplicate genes.</p>
            </title>
            <aug>
               <au>
                  <snm>Blanc</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Wolfe</snm>
                  <fnm>KH</fnm>
               </au>
            </aug>
            <source>Plant Cell</source>
            <pubdate>2004</pubdate>
            <volume>16</volume>
            <fpage>1667</fpage>
            <lpage>1678</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1105/tpc.021345</pubid>
                  <pubid idtype="pmcid">514152</pubid>
                  <pubid idtype="pmpid" link="fulltext">15208399</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B6">
            <title>
               <p>Widespread genome duplications throughout the history of flowering plants.</p>
            </title>
            <aug>
               <au>
                  <snm>Cui</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Wall</snm>
                  <fnm>PK</fnm>
               </au>
               <au>
                  <snm>Leebens-Mack</snm>
                  <fnm>JH</fnm>
               </au>
               <au>
                  <snm>Lindsay</snm>
                  <fnm>BG</fnm>
               </au>
               <au>
                  <snm>Soltis</snm>
                  <fnm>DE</fnm>
               </au>
               <au>
                  <snm>Doyle</snm>
                  <fnm>JJ</fnm>
               </au>
               <au>
                  <snm>Soltis</snm>
                  <fnm>PS</fnm>
               </au>
               <au>
                  <snm>Carlson</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Arumuganathan</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Barakat</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Albert</snm>
                  <fnm>VA</fnm>
               </au>
               <au>
                  <snm>Ma</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>dePamphilis</snm>
                  <fnm>CW</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2006</pubdate>
            <volume>16</volume>
            <fpage>738</fpage>
            <lpage>749</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1101/gr.4825606</pubid>
                  <pubid idtype="pmcid">1479859</pubid>
                  <pubid idtype="pmpid" link="fulltext">16702410</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B7">
            <title>
               <p>Analysis of the genome sequence of the flowering plant <it>Arabidopsis thaliana</it>.</p>
            </title>
            <aug>
               <au>
                  <cnm>The Arabidopsis Genome Initiative</cnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2000</pubdate>
            <volume>408</volume>
            <fpage>796</fpage>
            <lpage>815</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/35048692</pubid>
                  <pubid idtype="pmpid" link="fulltext">11130711</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B8">
            <title>
               <p>The map-based sequence of the rice genome.</p>
            </title>
            <aug>
               <au>
                  <cnm>International Rice Genome Sequencing Project</cnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2005</pubdate>
            <volume>436</volume>
            <fpage>793</fpage>
            <lpage>800</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature03895</pubid>
                  <pubid idtype="pmpid" link="fulltext">16100779</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B9">
            <title>
               <p>The genome of black cottonwood, <it>Populus trichocarpa </it>(Torr. &amp; Gray).</p>
            </title>
            <aug>
               <au>
                  <snm>Tuskan</snm>
                  <fnm>GA</fnm>
               </au>
               <au>
                  <snm>Difazio</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Jansson</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Bohlmann</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Grigoriev</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Hellsten</snm>
                  <fnm>U</fnm>
               </au>
               <au>
                  <snm>Putnam</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Ralph</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Rombauts</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Salamov</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Schein</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Sterck</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Aerts</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Bhalerao</snm>
                  <fnm>RR</fnm>
               </au>
               <au>
                  <snm>Bhalerao</snm>
                  <fnm>RP</fnm>
               </au>
               <au>
                  <snm>Blaudez</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Boerjan</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Brun</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Brunner</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Busov</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Campbell</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Carlson</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Chalot</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Chapman</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>GL</fnm>
               </au>
               <au>
                  <snm>Cooper</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Coutinho</snm>
                  <fnm>PM</fnm>
               </au>
               <au>
                  <snm>Couturier</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Covert</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Cronk</snm>
                  <fnm>Q</fnm>
               </au>
               <etal/>
            </aug>
            <source>Science</source>
            <pubdate>2006</pubdate>
            <volume>313</volume>
            <fpage>1596</fpage>
            <lpage>1604</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.1128691</pubid>
                  <pubid idtype="pmpid" link="fulltext">16973872</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B10">
            <title>
               <p>The grapevine genome sequence suggests ancestral hexaploidization in major angiosperm phyla.</p>
            </title>
            <aug>
               <au>
                  <cnm>The French-Italian Public Consortium for Grapevine Genome Characterization</cnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2007</pubdate>
            <volume>449</volume>
            <fpage>463</fpage>
            <lpage>468</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature06148</pubid>
                  <pubid idtype="pmpid" link="fulltext">17721507</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B11">
            <title>
               <p>The draft genome of the transgenic tropical fruit tree papaya (<it>Carica papaya </it>Linnaeus).</p>
            </title>
            <aug>
               <au>
                  <snm>Ming</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Hou</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Feng</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Yu</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Dionne-Laporte</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Saw</snm>
                  <fnm>JH</fnm>
               </au>
               <au>
                  <snm>Senin</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Ly</snm>
                  <fnm>BV</fnm>
               </au>
               <au>
                  <snm>Lewis</snm>
                  <fnm>KL</fnm>
               </au>
               <au>
                  <snm>Salzberg</snm>
                  <fnm>SL</fnm>
               </au>
               <au>
                  <snm>Feng</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Jones</snm>
                  <fnm>MR</fnm>
               </au>
               <au>
                  <snm>Skelton</snm>
                  <fnm>RL</fnm>
               </au>
               <au>
                  <snm>Murray</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Qian</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Shen</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Du</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Eustice</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Tong</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Tang</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Lyons</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Paull</snm>
                  <fnm>RE</fnm>
               </au>
               <au>
                  <snm>Michael</snm>
                  <fnm>TP</fnm>
               </au>
               <au>
                  <snm>Wall</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Rice</snm>
                  <fnm>DW</fnm>
               </au>
               <au>
                  <snm>Albert</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>ML</fnm>
               </au>
               <au>
                  <snm>Zhu</snm>
                  <fnm>YJ</fnm>
               </au>
               <etal/>
            </aug>
            <source>Nature</source>
            <pubdate>2008</pubdate>
            <volume>452</volume>
            <fpage>991</fpage>
            <lpage>996</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature06856</pubid>
                  <pubid idtype="pmpid" link="fulltext">18432245</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B12">
            <title>
               <p>The <it>Sorghum bicolor </it>genome and the diversification of grasses.</p>
            </title>
            <aug>
               <au>
                  <snm>Paterson</snm>
                  <fnm>AH</fnm>
               </au>
               <au>
                  <snm>Bowers</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Bruggmann</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Dubchak</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Grimwood</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Gundlach</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Haberer</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Hellsten</snm>
                  <fnm>U</fnm>
               </au>
               <au>
                  <snm>Mitros</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Poliakov</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Schmutz</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Spannagl</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Tang</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Wicker</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Bharti</snm>
                  <fnm>AK</fnm>
               </au>
               <au>
                  <snm>Chapman</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Feltus</snm>
                  <fnm>FA</fnm>
               </au>
               <au>
                  <snm>Gowik</snm>
                  <fnm>U</fnm>
               </au>
               <au>
                  <snm>Grigoriev</snm>
                  <fnm>IV</fnm>
               </au>
               <au>
                  <snm>Lyons</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Maher</snm>
                  <fnm>CA</fnm>
               </au>
               <au>
                  <snm>Martis</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Narechania</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Otillar</snm>
                  <fnm>RP</fnm>
               </au>
               <au>
                  <snm>Penning</snm>
                  <fnm>BW</fnm>
               </au>
               <au>
                  <snm>Salamov</snm>
                  <fnm>AA</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Carpita</snm>
                  <fnm>NC</fnm>
               </au>
               <etal/>
            </aug>
            <source>Nature</source>
            <pubdate>2009</pubdate>
            <volume>457</volume>
            <fpage>551</fpage>
            <lpage>556</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature07723</pubid>
                  <pubid idtype="pmpid" link="fulltext">19189423</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B13">
            <title>
               <p>Analysis of retrotransposon structural diversity uncovers properties and propensities in angiosperm genome evolution.</p>
            </title>
            <aug>
               <au>
                  <snm>Vitte</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Bennetzen</snm>
                  <fnm>JL</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2006</pubdate>
            <volume>103</volume>
            <fpage>17638</fpage>
            <lpage>17643</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1073/pnas.0605618103</pubid>
                  <pubid idtype="pmcid">1693799</pubid>
                  <pubid idtype="pmpid" link="fulltext">17101966</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B14">
            <title>
               <p>Functional divergence of duplicated genes formed by polyploidy during <it>Arabidopsis </it>evolution.</p>
            </title>
            <aug>
               <au>
                  <snm>Blanc</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Wolfe</snm>
                  <fnm>KH</fnm>
               </au>
            </aug>
            <source>Plant Cell</source>
            <pubdate>2004</pubdate>
            <volume>16</volume>
            <fpage>1679</fpage>
            <lpage>1691</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1105/tpc.021410</pubid>
                  <pubid idtype="pmcid">514153</pubid>
                  <pubid idtype="pmpid" link="fulltext">15208398</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B15">
            <title>
               <p>Genome size reduction through illegitimate recombination counteracts genome expansion in <it>Arabidopsis</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Devos</snm>
                  <fnm>KM</fnm>
               </au>
               <au>
                  <snm>Brown</snm>
                  <fnm>JK</fnm>
               </au>
               <au>
                  <snm>Bennetzen</snm>
                  <fnm>JL</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2002</pubdate>
            <volume>12</volume>
            <fpage>1075</fpage>
            <lpage>1079</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1101/gr.132102</pubid>
                  <pubid idtype="pmcid">186626</pubid>
                  <pubid idtype="pmpid" link="fulltext">12097344</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B16">
            <title>
               <p>Structure and evolution of cereal genomes.</p>
            </title>
            <aug>
               <au>
                  <snm>Paterson</snm>
                  <fnm>AH</fnm>
               </au>
               <au>
                  <snm>Bowers</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Peterson</snm>
                  <fnm>DG</fnm>
               </au>
               <au>
                  <snm>Estill</snm>
                  <fnm>JC</fnm>
               </au>
               <au>
                  <snm>Chapman</snm>
                  <fnm>BA</fnm>
               </au>
            </aug>
            <source>Curr Opin Genet Dev</source>
            <pubdate>2003</pubdate>
            <volume>13</volume>
            <fpage>644</fpage>
            <lpage>650</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.gde.2003.10.002</pubid>
                  <pubid idtype="pmpid" link="fulltext">14638328</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B17">
            <title>
               <p>Estimating genome conservation between crop and model legume species.</p>
            </title>
            <aug>
               <au>
                  <snm>Choi</snm>
                  <fnm>HK</fnm>
               </au>
               <au>
                  <snm>Mun</snm>
                  <fnm>J-H</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>DJ</fnm>
               </au>
               <au>
                  <snm>Zhu</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Baek</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Mudge</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Roe</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Ellis</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Doyle</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Kiss</snm>
                  <fnm>GB</fnm>
               </au>
               <au>
                  <snm>Young</snm>
                  <fnm>ND</fnm>
               </au>
               <au>
                  <snm>Cook</snm>
                  <fnm>DR</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2004</pubdate>
            <volume>101</volume>
            <fpage>15289</fpage>
            <lpage>15294</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1073/pnas.0402251101</pubid>
                  <pubid idtype="pmcid">524433</pubid>
                  <pubid idtype="pmpid" link="fulltext">15489274</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B18">
            <title>
               <p>Legume genome evolution viewed through the <it>Medicago truncatula </it>and <it>Lotus japonicus </it>genomes.</p>
            </title>
            <aug>
               <au>
                  <snm>Cannon</snm>
                  <fnm>SB</fnm>
               </au>
               <au>
                  <snm>Sterck</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Rombauts</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Sato</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Cheung</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Gouzy</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Mudge</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Vasdewani</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Schiex</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Spannagl</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Monaghan</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Nicholson</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Humphray</snm>
                  <fnm>SJ</fnm>
               </au>
               <au>
                  <snm>Schoof</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Mayer</snm>
                  <fnm>KF</fnm>
               </au>
               <au>
                  <snm>Rogers</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Qu&#233;tier</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Oldroyd</snm>
                  <fnm>GE</fnm>
               </au>
               <au>
                  <snm>Debell&#233;</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Cook</snm>
                  <fnm>DR</fnm>
               </au>
               <au>
                  <snm>Retzel</snm>
                  <fnm>EF</fnm>
               </au>
               <au>
                  <snm>Roe</snm>
                  <fnm>BA</fnm>
               </au>
               <au>
                  <snm>Town</snm>
                  <fnm>CD</fnm>
               </au>
               <au>
                  <snm>Tabata</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Peer</snm>
                  <mnm>Van de</mnm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Young</snm>
                  <fnm>ND</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2006</pubdate>
            <volume>103</volume>
            <fpage>14959</fpage>
            <lpage>14964</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1073/pnas.0603228103</pubid>
                  <pubid idtype="pmcid">1578499,1578499</pubid>
                  <pubid idtype="pmpid" link="fulltext">17003129</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B19">
            <title>
               <p>Comparative genomics of <it>Brassica oleracea </it>and <it>Arabidopsis thaliana </it>reveal gene loss, fragmentation, and dispersal after polyploidy.</p>
            </title>
            <aug>
               <au>
                  <snm>Town</snm>
                  <fnm>CD</fnm>
               </au>
               <au>
                  <snm>Cheung</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Maiti</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Crabtree</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Haas</snm>
                  <fnm>BJ</fnm>
               </au>
               <au>
                  <snm>Wortman</snm>
                  <fnm>JR</fnm>
               </au>
               <au>
                  <snm>Hine</snm>
                  <fnm>EE</fnm>
               </au>
               <au>
                  <snm>Althoff</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Arbogast</snm>
                  <fnm>TS</fnm>
               </au>
               <au>
                  <snm>Tallon</snm>
                  <fnm>LJ</fnm>
               </au>
               <au>
                  <snm>Vigouroux</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Trick</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Bancroft</snm>
                  <fnm>I</fnm>
               </au>
            </aug>
            <source>Plant Cell</source>
            <pubdate>2006</pubdate>
            <volume>18</volume>
            <fpage>1348</fpage>
            <lpage>1359</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1105/tpc.106.041665</pubid>
                  <pubid idtype="pmcid">1475499</pubid>
                  <pubid idtype="pmpid" link="fulltext">16632643</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B20">
            <title>
               <p>Sequence-level analysis of the diploidization process in the triplicated <it>FLOWERING LOCUS C </it>region of <it>Brassica rapa</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Yang</snm>
                  <fnm>TJ</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>JS</fnm>
               </au>
               <au>
                  <snm>Kwon</snm>
                  <fnm>SJ</fnm>
               </au>
               <au>
                  <snm>Lim</snm>
                  <fnm>KB</fnm>
               </au>
               <au>
                  <snm>Choi</snm>
                  <fnm>BS</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Jin</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Park</snm>
                  <fnm>JY</fnm>
               </au>
               <au>
                  <snm>Lim</snm>
                  <fnm>MH</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>HI</fnm>
               </au>
               <au>
                  <snm>Lim</snm>
                  <fnm>YP</fnm>
               </au>
               <au>
                  <snm>Kang</snm>
                  <fnm>JJ</fnm>
               </au>
               <au>
                  <snm>Hong</snm>
                  <fnm>JH</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>CB</fnm>
               </au>
               <au>
                  <snm>Bhak</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Bancroft</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Park</snm>
                  <fnm>BS</fnm>
               </au>
            </aug>
            <source>Plant Cell</source>
            <pubdate>2006</pubdate>
            <volume>18</volume>
            <fpage>1339</fpage>
            <lpage>1347</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1105/tpc.105.040535</pubid>
                  <pubid idtype="pmcid">1475497</pubid>
                  <pubid idtype="pmpid" link="fulltext">16632644</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B21">
            <title>
               <p>Brassicaceae phylogeny and trichome evolution.</p>
            </title>
            <aug>
               <au>
                  <snm>Beilstein</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Al-Shehbaz</snm>
                  <fnm>IA</fnm>
               </au>
               <au>
                  <snm>Kellogg</snm>
                  <fnm>EA</fnm>
               </au>
            </aug>
            <source>Am J Bot</source>
            <pubdate>2006</pubdate>
            <volume>93</volume>
            <fpage>607</fpage>
            <lpage>619</lpage>
            <xrefbib>
               <pubid idtype="doi">10.3732/ajb.93.4.607</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B22">
            <title>
               <p>Economic Research Service, USDA: Vegetables and Melons Outlook</p>
            </title>
            <url>http://www.ers.usda.gov/Publications/VGS/Tables/World.pdf</url>
         </bibl>
         <bibl id="B23">
            <title>
               <p>Segmental structure of the <it>Brassica napus </it>genome based on comparative analysis with <it>Arabidopsis thaliana</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Parkin</snm>
                  <fnm>IA</fnm>
               </au>
               <au>
                  <snm>Gulden</snm>
                  <fnm>SM</fnm>
               </au>
               <au>
                  <snm>Sharpe</snm>
                  <fnm>AG</fnm>
               </au>
               <au>
                  <snm>Lukens</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Trick</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Osborn</snm>
                  <fnm>TC</fnm>
               </au>
               <au>
                  <snm>Lydiate</snm>
                  <fnm>DJ</fnm>
               </au>
            </aug>
            <source>Genetics</source>
            <pubdate>2005</pubdate>
            <volume>171</volume>
            <fpage>765</fpage>
            <lpage>781</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1534/genetics.105.042093</pubid>
                  <pubid idtype="pmcid">1456786</pubid>
                  <pubid idtype="pmpid">16020789</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B24">
            <title>
               <p>Comparison of a <it>Brassica oleracea </it>genetic map with the genome of <it>Arabidopsis thaliana</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Lukens</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Zou</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Lydiate</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Parkin</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Osborn</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Genetics</source>
            <pubdate>2003</pubdate>
            <volume>164</volume>
            <fpage>359</fpage>
            <lpage>372</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1462567</pubid>
                  <pubid idtype="pmpid">12750346</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B25">
            <title>
               <p>A recent polyploidy superimposed on older large-scale duplications in the <it>Arabidopsis </it>genome.</p>
            </title>
            <aug>
               <au>
                  <snm>Blanc</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Hokamp</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Wolfe</snm>
                  <fnm>KH</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2003</pubdate>
            <volume>13</volume>
            <fpage>137</fpage>
            <lpage>144</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1101/gr.751803</pubid>
                  <pubid idtype="pmcid">420368</pubid>
                  <pubid idtype="pmpid" link="fulltext">12566392</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B26">
            <title>
               <p>Chromosome triplication found across the tribe <it>Brassiceae</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Lysak</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Koch</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Pecinka</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Schubert</snm>
                  <fnm>I</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2005</pubdate>
            <volume>15</volume>
            <fpage>516</fpage>
            <lpage>525</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1101/gr.3531105</pubid>
                  <pubid idtype="pmcid">1074366</pubid>
                  <pubid idtype="pmpid" link="fulltext">15781573</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B27">
            <title>
               <p><it>Brassica </it>Genome Gateway.</p>
            </title>
            <url>http://brassica.bbsrc.ac.uk</url>
         </bibl>
         <bibl id="B28">
            <title>
               <p>The Korea <it>Brassica rapa </it>Genome Project</p>
            </title>
            <url>http://www.brassica-rapa.org/BRGP/index.jsp</url>
         </bibl>
         <bibl id="B29">
            <title>
               <p>The Korea <it>Brassica </it>Genome Projects: a glimpse of the <it>Brassica </it>genome based on comparative genome analysis with <it>Arabidopsis</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Yang</snm>
                  <fnm>TJ</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>JS</fnm>
               </au>
               <au>
                  <snm>Lim</snm>
                  <fnm>KB</fnm>
               </au>
               <au>
                  <snm>Kwon</snm>
                  <fnm>SJ</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Jin</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Park</snm>
                  <fnm>JY</fnm>
               </au>
               <au>
                  <snm>Lim</snm>
                  <fnm>MH</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>HI</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>SH</fnm>
               </au>
               <au>
                  <snm>Lim</snm>
                  <fnm>YP</fnm>
               </au>
               <au>
                  <snm>Park</snm>
                  <fnm>BS</fnm>
               </au>
            </aug>
            <source>Comp Funct Genomics</source>
            <pubdate>2005</pubdate>
            <volume>6</volume>
            <fpage>138</fpage>
            <lpage>146</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1002/cfg.465</pubid>
                  <pubid idtype="pmpid" link="fulltext">18629219</pubid>
                  <pubid idtype="pmcid">2447515</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B30">
            <title>
               <p>Evolution of genome size in Brassicaceae.</p>
            </title>
            <aug>
               <au>
                  <snm>Johnston</snm>
                  <fnm>JS</fnm>
               </au>
               <au>
                  <snm>Pepper</snm>
                  <fnm>AE</fnm>
               </au>
               <au>
                  <snm>Hall</snm>
                  <fnm>AE</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>ZJ</fnm>
               </au>
               <au>
                  <snm>Hodnett</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Drabek</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Lopez</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Price</snm>
                  <fnm>HJ</fnm>
               </au>
            </aug>
            <source>Ann Bot</source>
            <pubdate>2005</pubdate>
            <volume>95</volume>
            <fpage>229</fpage>
            <lpage>235</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/aob/mci016</pubid>
                  <pubid idtype="pmcid">1950721</pubid>
                  <pubid idtype="pmpid">15596470</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B31">
            <title>
               <p>Genome-wide analysis of NBS-LRR-encoding genes in <it>Arabidopsis</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Meyers</snm>
                  <fnm>BC</fnm>
               </au>
               <au>
                  <snm>Kozik</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Griego</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Kuang</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Michelmore</snm>
                  <fnm>RW</fnm>
               </au>
            </aug>
            <source>Plant Cell</source>
            <pubdate>2003</pubdate>
            <volume>15</volume>
            <fpage>809</fpage>
            <lpage>834</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1105/tpc.009308</pubid>
                  <pubid idtype="pmcid">152331</pubid>
                  <pubid idtype="pmpid" link="fulltext">12671079</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B32">
            <title>
               <p>Genome-wide identification of NBS-encoding resistance genes in <it>Brassica rapa</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Mun</snm>
                  <fnm>J-H</fnm>
               </au>
               <au>
                  <snm>Yu</snm>
                  <fnm>H-J</fnm>
               </au>
               <au>
                  <snm>Park</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Park</snm>
                  <fnm>B-S</fnm>
               </au>
            </aug>
            <source>Mol Genet Genomics</source>
            <pubdate>2009</pubdate>
            <note>doi: 10.1007/s00438-009-0492-0</note>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">19838736</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B33">
            <title>
               <p>Genome-wide comparative analysis of the transposable elements in the related species <it>Arabidopsis thaliana </it>and <it>Brassica oleracea</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Zhang</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Wessler</snm>
                  <fnm>SR</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2004</pubdate>
            <volume>101</volume>
            <fpage>5589</fpage>
            <lpage>5594</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1073/pnas.0401243101</pubid>
                  <pubid idtype="pmcid">397431</pubid>
                  <pubid idtype="pmpid" link="fulltext">15064405</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B34">
            <title>
               <p>Characterization of the centromere and peri-centromere retrotransposons in <it>Brassica rapa </it>and their distribution in related <it>Brassica </it>species.</p>
            </title>
            <aug>
               <au>
                  <snm>Lim</snm>
                  <fnm>KB</fnm>
               </au>
               <au>
                  <snm>Yang</snm>
                  <fnm>TJ</fnm>
               </au>
               <au>
                  <snm>Hwang</snm>
                  <fnm>YJ</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>JS</fnm>
               </au>
               <au>
                  <snm>Park</snm>
                  <fnm>JY</fnm>
               </au>
               <au>
                  <snm>Kwon</snm>
                  <fnm>SJ</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Choi</snm>
                  <fnm>BS</fnm>
               </au>
               <au>
                  <snm>Lim</snm>
                  <fnm>MH</fnm>
               </au>
               <au>
                  <snm>Jin</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>HI</fnm>
               </au>
               <au>
                  <snm>de Jong</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Bancroft</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Lim</snm>
                  <fnm>YP</fnm>
               </au>
               <au>
                  <snm>Park</snm>
                  <fnm>BS</fnm>
               </au>
            </aug>
            <source>Plant J</source>
            <pubdate>2007</pubdate>
            <volume>49</volume>
            <fpage>173</fpage>
            <lpage>183</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1111/j.1365-313X.2006.02952.x</pubid>
                  <pubid idtype="pmpid" link="fulltext">17156411</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B35">
            <title>
               <p>Terminal repeat retrotransposon in miniature (TRIM) as DNA markers in <it>Brassica </it>relatives.</p>
            </title>
            <aug>
               <au>
                  <snm>Kwon</snm>
                  <fnm>SJ</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>DH</fnm>
               </au>
               <au>
                  <snm>Lim</snm>
                  <fnm>MH</fnm>
               </au>
               <au>
                  <snm>Long</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Meng</snm>
                  <fnm>JL</fnm>
               </au>
               <au>
                  <snm>Lim</snm>
                  <fnm>KB</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>JS</fnm>
               </au>
               <au>
                  <snm>Jin</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>HI</fnm>
               </au>
               <au>
                  <snm>Ahn</snm>
                  <fnm>SN</fnm>
               </au>
               <au>
                  <snm>Wessler</snm>
                  <fnm>SR</fnm>
               </au>
               <au>
                  <snm>Yang</snm>
                  <fnm>TJ</fnm>
               </au>
               <au>
                  <snm>Park</snm>
                  <fnm>BS</fnm>
               </au>
            </aug>
            <source>Mol Genet Genomics</source>
            <pubdate>2007</pubdate>
            <volume>278</volume>
            <fpage>361</fpage>
            <lpage>370</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1007/s00438-007-0249-6</pubid>
                  <pubid idtype="pmpid" link="fulltext">17690909</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B36">
            <title>
               <p>DiagHunter and GenoPix2D: programs for genomic comparisons, large-scale homology discovery and visualization.</p>
            </title>
            <aug>
               <au>
                  <snm>Cannon</snm>
                  <fnm>SB</fnm>
               </au>
               <au>
                  <snm>Kozik</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Chan</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Michelmore</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Young</snm>
                  <fnm>ND</fnm>
               </au>
            </aug>
            <source>Genome Biol</source>
            <pubdate>2003</pubdate>
            <volume>4</volume>
            <fpage>R68</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1186/gb-2003-4-10-r68</pubid>
                  <pubid idtype="pmcid">328457</pubid>
                  <pubid idtype="pmpid" link="fulltext">14519203</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B37">
            <title>
               <p>The ABC's of comparative genomics in the Brassicaceae: building blocks of crucifer genomes.</p>
            </title>
            <aug>
               <au>
                  <snm>Schranz</snm>
                  <fnm>ME</fnm>
               </au>
               <au>
                  <snm>Lysak</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Mitchell-Olds</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Trends Plant Sci</source>
            <pubdate>2006</pubdate>
            <volume>11</volume>
            <fpage>535</fpage>
            <lpage>542</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.tplants.2006.09.002</pubid>
                  <pubid idtype="pmpid" link="fulltext">17029932</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B38">
            <title>
               <p>Mechanisms of chromosome number reduction in <it>Arabidopsis thaliana </it>and related Brassicaceae species.</p>
            </title>
            <aug>
               <au>
                  <snm>Lysak</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Berr</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Pecinka</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Schmidt</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>McBreen</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Schubert</snm>
                  <fnm>I</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2006</pubdate>
            <volume>103</volume>
            <fpage>5224</fpage>
            <lpage>5229</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1073/pnas.0510791103</pubid>
                  <pubid idtype="pmcid">1458822</pubid>
                  <pubid idtype="pmpid" link="fulltext">16549785</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B39">
            <title>
               <p>History, protohistory and prehistory of the <it>Arabidopsis thaliana </it>chromosome complement.</p>
            </title>
            <aug>
               <au>
                  <snm>Henry</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Bedhomme</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Blanc</snm>
                  <fnm>G</fnm>
               </au>
            </aug>
            <source>Trends Plant Sci</source>
            <pubdate>2006</pubdate>
            <volume>11</volume>
            <fpage>267</fpage>
            <lpage>273</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.tplants.2006.04.002</pubid>
                  <pubid idtype="pmpid" link="fulltext">16690345</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B40">
            <title>
               <p>Comparative evolutionary analysis of chalcone synthase and alcohol dehydrogenase loci in <it>Arabidopsis</it>, <it>Arabis</it>, and related genera (Brassicaceae).</p>
            </title>
            <aug>
               <au>
                  <snm>Koch</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Haubold</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Mitchell-Olds</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2000</pubdate>
            <volume>17</volume>
            <fpage>1483</fpage>
            <lpage>1498</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">11018155</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B41">
            <title>
               <p>Leafing through the genomes of our major crop plants: strategies for capturing unique information.</p>
            </title>
            <aug>
               <au>
                  <snm>Paterson</snm>
                  <fnm>AH</fnm>
               </au>
            </aug>
            <source>Nat Rev Genet</source>
            <pubdate>2006</pubdate>
            <volume>7</volume>
            <fpage>174</fpage>
            <lpage>184</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nrg1806</pubid>
                  <pubid idtype="pmpid" link="fulltext">16485017</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B42">
            <title>
               <p>Differential methylation of genes and retrotransposons facilitates shotgun sequencing of the maize genome.</p>
            </title>
            <aug>
               <au>
                  <snm>Rabinowicz</snm>
                  <fnm>PD</fnm>
               </au>
               <au>
                  <snm>Schutz</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Dedhia</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Yordan</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Parnell</snm>
                  <fnm>LD</fnm>
               </au>
               <au>
                  <snm>Stein</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>McCombie</snm>
                  <fnm>WR</fnm>
               </au>
               <au>
                  <snm>Martienssen</snm>
                  <fnm>RA</fnm>
               </au>
            </aug>
            <source>Nat Genet</source>
            <pubdate>1999</pubdate>
            <volume>23</volume>
            <fpage>305</fpage>
            <lpage>308</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/15479</pubid>
                  <pubid idtype="pmpid" link="fulltext">10545948</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B43">
            <title>
               <p>Integration of Cot analysis, DNA cloning, and high-throughput sequencing facilitates genome characterization and gene discovery.</p>
            </title>
            <aug>
               <au>
                  <snm>Peterson</snm>
                  <fnm>DG</fnm>
               </au>
               <au>
                  <snm>Schulze</snm>
                  <fnm>SR</fnm>
               </au>
               <au>
                  <snm>Sciara</snm>
                  <fnm>EB</fnm>
               </au>
               <au>
                  <snm>Lee</snm>
                  <fnm>SA</fnm>
               </au>
               <au>
                  <snm>Bowers</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Nagel</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Jiang</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Tibbitts</snm>
                  <fnm>DC</fnm>
               </au>
               <au>
                  <snm>Wessler</snm>
                  <fnm>SR</fnm>
               </au>
               <au>
                  <snm>Paterson</snm>
                  <fnm>AH</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2002</pubdate>
            <volume>12</volume>
            <fpage>795</fpage>
            <lpage>807</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1101/gr.226102</pubid>
                  <pubid idtype="pmcid">186575</pubid>
                  <pubid idtype="pmpid" link="fulltext">11997346</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B44">
            <title>
               <p>The evolutionary fate and consequences of duplicate genes.</p>
            </title>
            <aug>
               <au>
                  <snm>Lynch</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Conery</snm>
                  <fnm>JS</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2000</pubdate>
            <volume>290</volume>
            <fpage>1151</fpage>
            <lpage>1155</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.290.5494.1151</pubid>
                  <pubid idtype="pmpid" link="fulltext">11073452</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B45">
            <title>
               <p>Novel patterns of gene expression in polyploid plants.</p>
            </title>
            <aug>
               <au>
                  <snm>Adams</snm>
                  <fnm>KL</fnm>
               </au>
               <au>
                  <snm>Wendel</snm>
                  <fnm>JF</fnm>
               </au>
            </aug>
            <source>Trends Genet</source>
            <pubdate>2005</pubdate>
            <volume>21</volume>
            <fpage>539</fpage>
            <lpage>543</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.tig.2005.07.009</pubid>
                  <pubid idtype="pmpid" link="fulltext">16098633</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B46">
            <title>
               <p>Gene loss and silencing in <it>Tragopogon miscellus </it>(Asteraceae): comparison of natural and synthetic allotetraploids.</p>
            </title>
            <aug>
               <au>
                  <snm>Buggs</snm>
                  <fnm>RJA</fnm>
               </au>
               <au>
                  <snm>Doust</snm>
                  <fnm>AN</fnm>
               </au>
               <au>
                  <snm>Tate</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Koh</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Soltis</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Feltus</snm>
                  <fnm>FA</fnm>
               </au>
               <au>
                  <snm>Paterson</snm>
                  <fnm>AH</fnm>
               </au>
               <au>
                  <snm>Soltis</snm>
                  <fnm>PS</fnm>
               </au>
               <au>
                  <snm>Soltis</snm>
                  <fnm>DE</fnm>
               </au>
            </aug>
            <source>Heredity</source>
            <pubdate>2009</pubdate>
            <volume>103</volume>
            <fpage>73</fpage>
            <lpage>81</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/hdy.2009.24</pubid>
                  <pubid idtype="pmpid" link="fulltext">19277058</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B47">
            <title>
               <p>Rapid genome change in synthetic polyploids of <it>Brassica </it>and its implications for polyploidy evolution.</p>
            </title>
            <aug>
               <au>
                  <snm>Song</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Lu</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Tang</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Osborn</snm>
                  <fnm>TC</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>1995</pubdate>
            <volume>92</volume>
            <fpage>7719</fpage>
            <lpage>7723</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1073/pnas.92.17.7719</pubid>
                  <pubid idtype="pmcid">41217</pubid>
                  <pubid idtype="pmpid">7644483</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B48">
            <title>
               <p>Genome evolution in polyploids.</p>
            </title>
            <aug>
               <au>
                  <snm>Wendel</snm>
                  <fnm>JF</fnm>
               </au>
            </aug>
            <source>Plant Mol Biol</source>
            <pubdate>2000</pubdate>
            <volume>42</volume>
            <fpage>225</fpage>
            <lpage>249</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1023/A:1006392424384</pubid>
                  <pubid idtype="pmpid" link="fulltext">10688139</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B49">
            <title>
               <p>Mechanisms of recent genome size variation in flowering plants.</p>
            </title>
            <aug>
               <au>
                  <snm>Bennetzen</snm>
                  <fnm>JL</fnm>
               </au>
               <au>
                  <snm>Ma</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Devos</snm>
                  <fnm>KM</fnm>
               </au>
            </aug>
            <source>Ann Bot</source>
            <pubdate>2005</pubdate>
            <volume>95</volume>
            <fpage>127</fpage>
            <lpage>132</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/aob/mci008</pubid>
                  <pubid idtype="pmpid">15596462</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B50">
            <title>
               <p>Genomic changes in resynthesized <it>Brassica napus </it>and their effect on gene expression and phenotype.</p>
            </title>
            <aug>
               <au>
                  <snm>Gaeta</snm>
                  <fnm>RT</fnm>
               </au>
               <au>
                  <snm>Pires</snm>
                  <fnm>JC</fnm>
               </au>
               <au>
                  <snm>Iniguez-Luy</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Leon</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Osborn</snm>
                  <fnm>TC</fnm>
               </au>
            </aug>
            <source>Plant Cell</source>
            <pubdate>2007</pubdate>
            <volume>19</volume>
            <fpage>3403</fpage>
            <lpage>3417</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1105/tpc.107.054346</pubid>
                  <pubid idtype="pmcid">2174891</pubid>
                  <pubid idtype="pmpid" link="fulltext">18024568</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B51">
            <title>
               <p>Sequencing of the <it>Triticum monococcum </it>hardness locus reveals good microcolinearity with rice.</p>
            </title>
            <aug>
               <au>
                  <snm>Chantret</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Cenci</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Sabot</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Anderson</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Dubcovsky</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Mol Genet Genomics</source>
            <pubdate>2004</pubdate>
            <volume>271</volume>
            <fpage>377</fpage>
            <lpage>386</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1007/s00438-004-0991-y</pubid>
                  <pubid idtype="pmpid" link="fulltext">15014981</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B52">
            <title>
               <p>Novel patterns of gene expression in polyploid plants.</p>
            </title>
            <aug>
               <au>
                  <snm>Adams</snm>
                  <fnm>KL</fnm>
               </au>
               <au>
                  <snm>Wendel</snm>
                  <fnm>JF</fnm>
               </au>
            </aug>
            <source>Trends Genet</source>
            <pubdate>2005</pubdate>
            <volume>21</volume>
            <fpage>539</fpage>
            <lpage>543</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.tig.2005.07.009</pubid>
                  <pubid idtype="pmpid" link="fulltext">16098633</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B53">
            <title>
               <p>A sequence-tagged linkage map of <it>Brassica rapa</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Kim</snm>
                  <fnm>JS</fnm>
               </au>
               <au>
                  <snm>Chung</snm>
                  <fnm>TY</fnm>
               </au>
               <au>
                  <snm>King</snm>
                  <fnm>GJ</fnm>
               </au>
               <au>
                  <snm>Jin</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Yang</snm>
                  <fnm>TJ</fnm>
               </au>
               <au>
                  <snm>Jin</snm>
                  <fnm>YM</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>HI</fnm>
               </au>
               <au>
                  <snm>Park</snm>
                  <fnm>BS</fnm>
               </au>
            </aug>
            <source>Genetics</source>
            <pubdate>2006</pubdate>
            <volume>174</volume>
            <fpage>29</fpage>
            <lpage>39</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1534/genetics.106.060152</pubid>
                  <pubid idtype="pmcid">1569789</pubid>
                  <pubid idtype="pmpid">16988107</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B54">
            <title>
               <p>The first generation of a BAC-based physical map of <it>Brassica rapa</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Mun</snm>
                  <fnm>J-H</fnm>
               </au>
               <au>
                  <snm>Kwon</snm>
                  <fnm>SJ</fnm>
               </au>
               <au>
                  <snm>Yang</snm>
                  <fnm>TJ</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>HS</fnm>
               </au>
               <au>
                  <snm>Choi</snm>
                  <fnm>BS</fnm>
               </au>
               <au>
                  <snm>Baek</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>JS</fnm>
               </au>
               <au>
                  <snm>Jin</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Lim</snm>
                  <fnm>MH</fnm>
               </au>
               <au>
                  <snm>Lee</snm>
                  <fnm>SI</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>HI</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Lim</snm>
                  <fnm>YP</fnm>
               </au>
               <au>
                  <snm>Park</snm>
                  <fnm>BS</fnm>
               </au>
            </aug>
            <source>BMC Genomics</source>
            <pubdate>2008</pubdate>
            <volume>9</volume>
            <fpage>280</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1186/1471-2164-9-280</pubid>
                  <pubid idtype="pmcid">2432078</pubid>
                  <pubid idtype="pmpid" link="fulltext">18549474</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B55">
            <title>
               <p>PipMaker-a web server for aligning two genomic DNA sequences.</p>
            </title>
            <aug>
               <au>
                  <snm>Schwartz</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Frazer</snm>
                  <fnm>KA</fnm>
               </au>
               <au>
                  <snm>Smit</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Riemer</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Bouck</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Gibbs</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Hardison</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Miller</snm>
                  <fnm>W</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2000</pubdate>
            <volume>10</volume>
            <fpage>577</fpage>
            <lpage>586</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1101/gr.10.4.577</pubid>
                  <pubid idtype="pmcid">310868</pubid>
                  <pubid idtype="pmpid" link="fulltext">10779500</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B56">
            <title>
               <p>Consed: a graphical tool for sequence finishing.</p>
            </title>
            <aug>
               <au>
                  <snm>Gordon</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Abajian</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Green</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>1998</pubdate>
            <volume>8</volume>
            <fpage>195</fpage>
            <lpage>202</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">9521923</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B57">
            <title>
               <p>Base calling of automated sequencer traces using phred. I. Accuracy assessment.</p>
            </title>
            <aug>
               <au>
                  <snm>Ewing</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Hillier</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Wendl</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Green</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>1998</pubdate>
            <volume>8</volume>
            <fpage>175</fpage>
            <lpage>185</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">9521921</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B58">
            <title>
               <p>Basecalling of automated sequencer traces using phred. II. Error probabilities.</p>
            </title>
            <aug>
               <au>
                  <snm>Ewing</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Green</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>1998</pubdate>
            <volume>8</volume>
            <fpage>186</fpage>
            <lpage>194</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">9521922</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B59">
            <title>
               <p>BLAT - the BLAST-like alignment tool.</p>
            </title>
            <aug>
               <au>
                  <snm>Kent</snm>
                  <fnm>WJ</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2002</pubdate>
            <volume>12</volume>
            <fpage>656</fpage>
            <lpage>664</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">187518</pubid>
                  <pubid idtype="pmpid" link="fulltext">11932250</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B60">
            <title>
               <p>Gapped BLAST and PSI-BLAST: a new generation of protein database search programs.</p>
            </title>
            <aug>
               <au>
                  <snm>Altschul</snm>
                  <fnm>SF</fnm>
               </au>
               <au>
                  <snm>Madden</snm>
                  <fnm>TL</fnm>
               </au>
               <au>
                  <snm>Sch&#228;ffer</snm>
                  <fnm>AA</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Miller</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Lipman</snm>
                  <fnm>DJ</fnm>
               </au>
            </aug>
            <source>Nucleic Acid Res</source>
            <pubdate>1997</pubdate>
            <volume>25</volume>
            <fpage>3389</fpage>
            <lpage>3402</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/nar/25.17.3389</pubid>
                  <pubid idtype="pmcid">146917</pubid>
                  <pubid idtype="pmpid" link="fulltext">9254694</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B61">
            <title>
               <p>RepeatMasker.</p>
            </title>
            <url>http://www.repeatmasker.org/</url>
         </bibl>
         <bibl id="B62">
            <title>
               <p>Munich Information Center for Protein Sequence.</p>
            </title>
            <url>http://mips.gsf.de/proj/plant/webapp/recat/</url>
         </bibl>
         <bibl id="B63">
            <title>
               <p>Automated eukaryotic gene structure annotation using EVidenceModeler and the Program to Assemble Spliced Alignments.</p>
            </title>
            <aug>
               <au>
                  <snm>Haas</snm>
                  <fnm>BJ</fnm>
               </au>
               <au>
                  <snm>Salzberg</snm>
                  <fnm>SL</fnm>
               </au>
               <au>
                  <snm>Zhu</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Pertea</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Allen</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Orvis</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>White</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Buell</snm>
                  <fnm>CR</fnm>
               </au>
               <au>
                  <snm>Wortman</snm>
                  <fnm>JR</fnm>
               </au>
            </aug>
            <source>Genome Biol</source>
            <pubdate>2008</pubdate>
            <volume>9</volume>
            <fpage>R7</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1186/gb-2008-9-1-r7</pubid>
                  <pubid idtype="pmcid">2395244</pubid>
                  <pubid idtype="pmpid" link="fulltext">18190707</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B64">
            <title>
               <p>FGENESH.</p>
            </title>
            <url>http://www.softberry.com</url>
         </bibl>
         <bibl id="B65">
            <title>
               <p>AUGUSTUS: a web server for gene prediction in eukaryotes that allows user-defined constraints.</p>
            </title>
            <aug>
               <au>
                  <snm>Stanke</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Morgenstern</snm>
                  <fnm>B</fnm>
               </au>
            </aug>
            <source>Nucleic Acid Res</source>
            <pubdate>2005</pubdate>
            <volume>33</volume>
            <fpage>W465</fpage>
            <lpage>W467</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/nar/gki458</pubid>
                  <pubid idtype="pmcid">1160219</pubid>
                  <pubid idtype="pmpid" link="fulltext">15980513</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B66">
            <title>
               <p>Improving the <it>Arabidopsis </it>genome annotation using maximal transcript alignment assemblies.</p>
            </title>
            <aug>
               <au>
                  <snm>Haas</snm>
                  <fnm>BJ</fnm>
               </au>
               <au>
                  <snm>Delcher</snm>
                  <fnm>AL</fnm>
               </au>
               <au>
                  <snm>Mount</snm>
                  <fnm>SM</fnm>
               </au>
               <au>
                  <snm>Wortman</snm>
                  <fnm>JR</fnm>
               </au>
               <au>
                  <snm>Smith</snm>
                  <fnm>RK</fnm>
               </au>
               <au>
                  <snm>Hannick</snm>
                  <fnm>LI</fnm>
               </au>
               <au>
                  <snm>Maiti</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Ronning</snm>
                  <fnm>CM</fnm>
               </au>
               <au>
                  <snm>Rusch</snm>
                  <fnm>DB</fnm>
               </au>
               <au>
                  <snm>Town</snm>
                  <fnm>CD</fnm>
               </au>
               <au>
                  <snm>Salzberg</snm>
                  <fnm>SL</fnm>
               </au>
               <au>
                  <snm>White</snm>
                  <fnm>O</fnm>
               </au>
            </aug>
            <source>Nucleic Acid Res</source>
            <pubdate>2003</pubdate>
            <volume>31</volume>
            <fpage>5654</fpage>
            <lpage>5666</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/nar/gkg770</pubid>
                  <pubid idtype="pmcid">206470</pubid>
                  <pubid idtype="pmpid" link="fulltext">14500829</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B67">
            <title>
               <p>A tool for analyzing and annotating genomic sequences.</p>
            </title>
            <aug>
               <au>
                  <snm>Huang</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Adams</snm>
                  <fnm>MD</fnm>
               </au>
               <au>
                  <snm>Zhou</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Kerlavage</snm>
                  <fnm>AR</fnm>
               </au>
            </aug>
            <source>Genomics</source>
            <pubdate>1997</pubdate>
            <volume>46</volume>
            <fpage>37</fpage>
            <lpage>45</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1006/geno.1997.4984</pubid>
                  <pubid idtype="pmpid" link="fulltext">9403056</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B68">
            <title>
               <p>The Pfam protein families database.</p>
            </title>
            <aug>
               <au>
                  <snm>Bateman</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Birney</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Cerruti</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Durbin</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Etwiller</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Eddy</snm>
                  <fnm>SR</fnm>
               </au>
               <au>
                  <snm>Griffiths-Jones</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Howe</snm>
                  <fnm>KL</fnm>
               </au>
               <au>
                  <snm>Marshall</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Sonnhammer</snm>
                  <fnm>EL</fnm>
               </au>
            </aug>
            <source>Nucleic Acid Res</source>
            <pubdate>2002</pubdate>
            <volume>30</volume>
            <fpage>276</fpage>
            <lpage>280</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/nar/30.1.276</pubid>
                  <pubid idtype="pmcid">99071</pubid>
                  <pubid idtype="pmpid" link="fulltext">11752314</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B69">
            <title>
               <p>Plant Transposon-encoded Protein Database.</p>
            </title>
            <url>ftp://ftp.tigr.org/pub/data/TransposableElements/transposon_db.pep</url>
         </bibl>
         <bibl id="B70">
            <title>
               <p>A codon-based model of nucleotide substitution for protein-coding DNA sequences.</p>
            </title>
            <aug>
               <au>
                  <snm>Goldman</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Yang</snm>
                  <fnm>Z</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>1994</pubdate>
            <volume>11</volume>
            <fpage>725</fpage>
            <lpage>736</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">7968486</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B71">
            <title>
               <p>PAML 4: phylogenetic analysis by maximum likelihood.</p>
            </title>
            <aug>
               <au>
                  <snm>Yang</snm>
                  <fnm>Z</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2007</pubdate>
            <volume>24</volume>
            <fpage>1586</fpage>
            <lpage>1591</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/molbev/msm088</pubid>
                  <pubid idtype="pmpid" link="fulltext">17483113</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B72">
            <title>
               <p>Unravelling angiosperm genome evolution by phylogenetic analysis of chromosomal duplication events.</p>
            </title>
            <aug>
               <au>
                  <snm>Bowers</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Chapman</snm>
                  <fnm>BA</fnm>
               </au>
               <au>
                  <snm>Rong</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Paterson</snm>
                  <fnm>AH</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2003</pubdate>
            <volume>422</volume>
            <fpage>433</fpage>
            <lpage>438</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature01521</pubid>
                  <pubid idtype="pmpid" link="fulltext">12660784</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B73">
            <title>
               <p>Data used in this study.</p>
            </title>
            <url>http://www.brassica-rapa.org/brvsat</url>
         </bibl>
         <bibl id="B74">
            <title>
               <p>The <it>Arabidopsis </it>Information Resource.</p>
            </title>
            <url>http://www.arabidopsis.org/portals/genAnnotation</url>
         </bibl>
      </refgrp>
   </bm>
</art>

