<?xml version='1.0'?>
<!DOCTYPE art SYSTEM 'http://www.biomedcentral.com/xml/article.dtd'>
<art><ui>gb-2011-12-5-r48</ui><ji>1465-6906</ji><fm>
<dochead>Research</dochead>
<bibl>
<title>
<p>A physical map for the <it>Amborella trichopoda </it>genome sheds light on the evolution of angiosperm genome structure</p>
</title>
<aug>
<au id="A1"><snm>Zuccolo</snm><fnm>Andrea</fnm><insr iid="I1"/><email>azuccolo@ag.arizona.edu</email></au>
<au id="A2"><snm>Bowers</snm><mi>E</mi><fnm>John</fnm><insr iid="I2"/><email>jebowers@uga.edu</email></au>
<au id="A3"><snm>Estill</snm><mi>C</mi><fnm>James</fnm><insr iid="I2"/><email>jamesestill@gmail.com</email></au>
<au id="A4"><snm>Xiong</snm><fnm>Zhiyong</fnm><insr iid="I3"/><email>xiongz@missouri.edu</email></au>
<au id="A5"><snm>Luo</snm><fnm>Meizhong</fnm><insr iid="I1"/><insr iid="I4"/><email>mzluo@mail.hzau.edu.cn</email></au>
<au id="A6"><snm>Sebastian</snm><fnm>Aswathy</fnm><insr iid="I1"/><email>aswathyseb@gmail.com</email></au>
<au id="A7"><snm>Goicoechea</snm><mnm>Luis</mnm><fnm>Jos&#233;</fnm><insr iid="I1"/><email>jlgoicoe@ag.arizona.edu</email></au>
<au id="A8"><snm>Collura</snm><fnm>Kristi</fnm><insr iid="I1"/><email>kcollur@Ag.arizona.edu</email></au>
<au id="A9"><snm>Yu</snm><fnm>Yeisoo</fnm><insr iid="I1"/><email>yeisooyu@ag.arizona.edu</email></au>
<au id="A10"><snm>Jiao</snm><fnm>Yuannian</fnm><insr iid="I5"/><email>yxj129@psu.edu</email></au>
<au id="A11"><snm>Duarte</snm><fnm>Jill</fnm><insr iid="I5"/><email>jmr464@psu.edu</email></au>
<au id="A12"><snm>Tang</snm><fnm>Haibao</fnm><insr iid="I2"/><insr iid="I6"/><insr iid="I7"/><email>tanghaibao@gmail.com</email></au>
<au id="A13"><snm>Ayyampalayam</snm><fnm>Saravanaraj</fnm><insr iid="I2"/><email>raj@plantbio.uga.edu</email></au>
<au id="A14"><snm>Rounsley</snm><fnm>Steve</fnm><insr iid="I8"/><insr iid="I9"/><email>rounsley@email.arizona.edu</email></au>
<au id="A15"><snm>Kudrna</snm><fnm>Dave</fnm><insr iid="I1"/><email>dkudrna@ag.arizona.edu</email></au>
<au id="A16"><snm>Paterson</snm><mi>H</mi><fnm>Andrew</fnm><insr iid="I2"/><insr iid="I7"/><email>paterson@plantbio.uga.edu</email></au>
<au id="A17"><snm>Pires</snm><mnm>Chris</mnm><fnm>J</fnm><insr iid="I3"/><email>piresjc@missouri.edu</email></au>
<au id="A18"><snm>Chanderbali</snm><fnm>Andre</fnm><insr iid="I10"/><email>achander@ufl.edu</email></au>
<au id="A19"><snm>Soltis</snm><mi>E</mi><fnm>Douglas</fnm><insr iid="I10"/><email>psoltis@flmnh.ufl.edu</email></au>
<au id="A20"><snm>Chamala</snm><fnm>Srikar</fnm><insr iid="I10"/><email>vaalbert@buffalo.edu</email></au>
<au id="A21"><snm>Barbazuk</snm><fnm>Brad</fnm><insr iid="I10"/><email>bbarbazuk@ufl.edu</email></au>
<au id="A22"><snm>Soltis</snm><mi>S</mi><fnm>Pamela</fnm><insr iid="I11"/><email>psoltis@flmnh.ufl.edu</email></au>
<au id="A23"><snm>Albert</snm><mi>A</mi><fnm>Victor</fnm><insr iid="I12"/><email>vaalbert@buffalo.edu</email></au>
<au id="A24"><snm>Ma</snm><fnm>Hong</fnm><insr iid="I5"/><insr iid="I13"/><email>hxm16@psu.edu</email></au>
<au id="A25"><snm>Mandoli</snm><fnm>Dina</fnm><insr iid="I14"/><email>dina.mandoli@mac.com</email></au>
<au id="A26"><snm>Banks</snm><fnm>Jody</fnm><insr iid="I15"/><email>banksj@purdue.edu</email></au>
<au id="A27"><snm>Carlson</snm><mi>E</mi><fnm>John</fnm><insr iid="I16"/><email>jec16@psu.edu</email></au>
<au id="A28"><snm>Tomkins</snm><fnm>Jeffrey</fnm><insr iid="I17"/><email>jtmkns@clemson.edu</email></au>
<au id="A29"><snm>dePamphilis</snm><mi>W</mi><fnm>Claude</fnm><insr iid="I5"/><email>cwd3@psu.edu</email></au>
<au id="A30"><snm>Wing</snm><mi>A</mi><fnm>Rod</fnm><insr iid="I1"/><email>rwing@ag.arizona.edu</email></au>
<au ca="yes" id="A31"><snm>Leebens-Mack</snm><fnm>Jim</fnm><insr iid="I2"/><email>jleebensmack@plantbio.uga.edu</email></au>
</aug>
<insg>
<ins id="I1"><p>Arizona Genomics Institute, School of Plant Sciences and BIO5 Institute for Collaborative Research, University of Arizona, 1657 East Helen Street, Tucson, AZ 85721, USA</p></ins>
<ins id="I2"><p>Department of Plant Biology, University of Georgia, 4504 Miller Plant Sciences, Athens, GA 30602, USA</p></ins>
<ins id="I3"><p>Department of Biological Sciences, University of Missouri, 371B Life Sciences Center, Columbia, MO 65211, USA</p></ins>
<ins id="I4"><p>College of Life Sciences and Technology, Huazhong Agricultural University, Wuhan, Hubei 430070, China</p></ins>
<ins id="I5"><p>Intercollege Graduate Degree Program in Plant Biology and Institute of Molecular Evolutionary Genetics, Huck Institutes of the Life Sciences, The Pennsylvania State University, 405 Life Sciences Building, University Park, Pennsylvania 16802, USA</p></ins>
<ins id="I6"><p>Department of Plant and Microbiology, College of Natural Resources, University of California, 311 Koshland Hall, Berkeley 94709, CA, USA</p></ins>
<ins id="I7"><p>Plant Genome Mapping Laboratory, University of Georgia, 111 Riverbend Road, Athens, GA 30605, USA</p></ins>
<ins id="I8"><p>School of Plant Sciences and BIO5, University of Arizona, 1657 East Helen Street, Tucson, AZ 85721, USA</p></ins>
<ins id="I9"><p>Dow Agrosciences LLC, 9330 Zionsville Road, Indianapolis, IN 46268, USA</p></ins>
<ins id="I10"><p>Department of Biology, University of Florida, 220 Bartram Hall, Gainesville, FL 32611, USA</p></ins>
<ins id="I11"><p>Florida Museum of Natural History, Museum Road and Newell Drive, University of Florida, Gainesville, FL 32611, USA</p></ins>
<ins id="I12"><p>Department of Biological Sciences, University at Buffalo (SUNY), 637 Hochstetter Hall, Buffalo, NY 14260, USA</p></ins>
<ins id="I13"><p>State Key Laboratory of Genetic Engineering, School of Life Sciences, Institute of Plant Biology, Center for Evolutionary Biology, and Institutes of Biomedical Sciences, Fudan University, 220 Handan Road, Shanghai 200433, China</p></ins>
<ins id="I14"><p>Northern Lights, 4500 NE 40th Street, Seattle WA 98105, USA</p></ins>
<ins id="I15"><p>Department of Botany and Plant Pathology, Purdue University, B028 Whistler Hall, West Lafayette, IN 47906, USA</p></ins>
<ins id="I16"><p>School of Forest Resources, The Pennsylvania State University, 323 Forest Resources Building, University Park, PA 16802, USA</p></ins>
<ins id="I17"><p>Clemson University Genomics Institute, Clemson University, 51 Cherry St, Clemson, NC 29634, USA</p></ins>
</insg>
<source>Genome Biology</source>
<issn>1465-6906</issn>
<pubdate>2011</pubdate>
<volume>12</volume>
<issue>5</issue>
<fpage>R48</fpage>
<url>http://genomebiology.com/2011/12/5/R48</url>
<xrefbib><pubidlist><pubid idtype="doi">10.1186/gb-2011-12-5-r48</pubid><pubid idtype="pmpid">21619600</pubid></pubidlist></xrefbib>
</bibl>
<history><rec><date><day>21</day><month>11</month><year>2010</year></date></rec><revrec><date><day>19</day><month>5</month><year>2011</year></date></revrec><acc><date><day>27</day><month>5</month><year>2011</year></date></acc><pub><date><day>27</day><month>5</month><year>2011</year></date></pub></history>
<cpyrt><year>2011</year><collab>Zuccolo et al.; licensee BioMed Central Ltd.</collab><note>This is an open access article distributed under the terms of the Creative Commons Attribution License (<url>http://creativecommons.org/licenses/by/2.0</url>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</note></cpyrt>
<abs>
<sec>
<st>
<p>Abstract</p>
</st>
<sec>
<st>
<p>Background</p>
</st>
<p>Recent phylogenetic analyses have identified <it>Amborella trichopoda</it>, an understory tree species endemic to the forests of New Caledonia, as sister to a clade including all other known flowering plant species. The <it>Amborella </it>genome is a unique reference for understanding the evolution of angiosperm genomes because it can serve as an outgroup to root comparative analyses. A physical map, BAC end sequences and sample shotgun sequences provide a first view of the 870 Mbp <it>Amborella </it>genome.</p>
</sec>
<sec>
<st>
<p>Results</p>
</st>
<p>Analysis of <it>Amborella </it>BAC ends sequenced from each contig suggests that the density of long terminal repeat retrotransposons is negatively correlated with that of protein coding genes. Syntenic, presumably ancestral, gene blocks were identified in comparisons of the <it>Amborella </it>BAC contigs and the sequenced <it>Arabidopsis thaliana</it>, <it>Populus trichocarpa</it>, <it>Vitis vinifera </it>and <it>Oryza sativa </it>genomes. Parsimony mapping of the loss of synteny corroborates previous analyses suggesting that the rate of structural change has been more rapid on lineages leading to <it>Arabidopsis </it>and <it>Oryza </it>compared with lineages leading to <it>Populus </it>and <it>Vitis</it>. The gamma paleohexiploidy event identified in the <it>Arabidopsis</it>, <it>Populus </it>and <it>Vitis </it>genomes is shown to have occurred after the divergence of all other known angiosperms from the lineage leading to <it>Amborella</it>.</p>
</sec>
<sec>
<st>
<p>Conclusions</p>
</st>
<p>When placed in the context of a physical map, BAC end sequences representing just 5.4% of the <it>Amborella </it>genome have facilitated reconstruction of gene blocks that existed in the last common ancestor of all flowering plants. The <it>Amborella </it>genome is an invaluable reference for inferences concerning the ancestral angiosperm and subsequent genome evolution.</p>
</sec>
</sec>
</abs>
</fm><meta>
<classifications>
<classification id="30010008" subtype="man_spc_id" type="BMC">Evolution</classification>
<classification id="30010010" subtype="man_spc_id" type="BMC">Genome studies</classification>
<classification id="30010019" subtype="man_spc_id" type="BMC">Plant biology</classification>
</classifications>
</meta><bdy>
<sec>
<st>
<p>Background</p>
</st>
<p>The origin and rapid diversification of the angiosperms (flowering plants) were pivotal events in the evolutionary history of Earth's biota. Over the past 130 to 150 million years angiosperms have diversified to include approximately 350,000 species occupying nearly all habitable terrestrial and many aquatic environments. Angiosperms generate the vast majority of human food either directly or indirectly as animal feed, and they account for a huge proportion of land-based photosynthesis and carbon sequestration. Comparative analyses of genome sequences and gene function for a growing number of species are shedding light on how gene and genome duplications have contributed to the diversification within major flowering plant lineages (for example, Rosidae, Asteridae, Monocotyledoneae <abbrgrp>
<abbr bid="B1">1</abbr>
</abbrgrp>), but elucidation of the genetic and genomic processes underlying the key innovations associated with the origin of flowering plants (for example, typically bisexual flowers, endosperm formation, double fertilization, ovules with two integuments, seed development within the carpel) requires comparisons between lineages that diverged from the last common ancestor of all extant angiosperms <abbrgrp>
<abbr bid="B2">2</abbr>
<abbr bid="B3">3</abbr>
</abbrgrp>.</p>
<p>Recent phylogenetic analyses have identified <it>Amborella trichopoda</it>, an understory tree or shrub species endemic to the forests of New Caledonia, as the sister species to all other extant angiosperms <abbrgrp>
<abbr bid="B4">4</abbr>
<abbr bid="B5">5</abbr>
<abbr bid="B6">6</abbr>
<abbr bid="B7">7</abbr>
<abbr bid="B8">8</abbr>
</abbrgrp>. <it>Amborella </it>is no more 'ancient' or 'primitive' than any other extant flowering plant species, but comparisons between <it>Amborella </it>and other angiosperms are allowing researchers to triangulate on characteristics of their last common ancestor. Using a similar approach, researchers have used the complete genome sequence of platypus, <it>Ornithorhynchus anatinus</it>, representing the sister group of all other extant mammals, to elucidate mammalian genome evolution <abbrgrp>
<abbr bid="B9">9</abbr>
</abbrgrp>.</p>
<p>Previous comparisons of transcriptome content <abbrgrp>
<abbr bid="B10">10</abbr>
</abbrgrp>, gene expression patterns <abbrgrp>
<abbr bid="B11">11</abbr>
<abbr bid="B12">12</abbr>
<abbr bid="B13">13</abbr>
</abbrgrp>, and gene function <abbrgrp>
<abbr bid="B14">14</abbr>
<abbr bid="B15">15</abbr>
</abbrgrp> between <it>Amborella </it>and other flowering plant species have suggested that much of the floral development program that has been characterized in <it>Arabidopsis</it>, snapdragon and maize existed in the last common ancestor of extant angiosperms. While gene duplications in the MADS-box transcription factor family likely contributed to the earliest floral development regulatory networks <abbrgrp>
<abbr bid="B11">11</abbr>
<abbr bid="B12">12</abbr>
<abbr bid="B16">16</abbr>
<abbr bid="B17">17</abbr>
<abbr bid="B18">18</abbr>
<abbr bid="B19">19</abbr>
</abbrgrp>, it is not clear whether these were single gene duplications or the product of polyploidization. Genome duplications have occurred repeatedly throughout angiosperm history <abbrgrp>
<abbr bid="B20">20</abbr>
<abbr bid="B21">21</abbr>
<abbr bid="B22">22</abbr>
<abbr bid="B23">23</abbr>
</abbrgrp> but there is uncertainty in the timing of polyploidy events relative to the origin of the angiosperms and important innovations in flowering plant history <abbrgrp>
<abbr bid="B24">24</abbr>
</abbrgrp>.</p>
<p>Here we describe a BAC-based draft physical map for <it>A. trichopoda </it>and use BAC end sequences (BESs) to compare the structure of the <it>Amborella </it>genome to representative eudicot (<it>Vitis</it>, <it>Populus </it>and <it>Arabidopsis</it>) and grass (<it>Oryza</it>) genomes. Comparative analyses of sequences for two large contiguous regions (487.3 and 629.7 kb in the <it>Amborella </it>genome) were also performed. In addition we use a large transcriptome assembly to identify BAC ends matching protein-coding sequences <abbrgrp>
<abbr bid="B25">25</abbr>
</abbrgrp>. Our aim here is to begin to investigate whether regions of these genomes have remained syntenic throughout angiosperm history, and determine whether ancient genome duplications discovered in eudicot and grass genomes <abbrgrp>
<abbr bid="B26">26</abbr>
<abbr bid="B27">27</abbr>
<abbr bid="B28">28</abbr>
<abbr bid="B29">29</abbr>
</abbrgrp> occurred before or after the divergence of these lineages from the <it>Amborella </it>lineage. In addition, the physical map and sequence analyses establish a framework for future studies of all flowering plant genomes, including the <it>Amborella </it>genome itself.</p>
</sec>
<sec>
<st>
<p>Results and discussion</p>
</st>
<sec>
<st>
<p>BAC library and physical map</p>
</st>
<p>The structure and composition of the 870 Mbp/C <abbrgrp>
<abbr bid="B30">30</abbr>
</abbrgrp>
<it>A. trichopoda </it>genome was investigated through physical mapping of clones from a 5.2 &#215; coverage BAC library. The library was constructed after partial digest of high-molecular-weight DNA with <it>Hin</it>dIII. The library, which comprises 36,684 BAC clones with an estimated average insert size of 123 kb, is available through the Arizona Genomics Institute <abbrgrp>
<abbr bid="B31">31</abbr>
</abbrgrp>. The BAC library was double spotted in high density onto Hybond N+ filters. All 36,684 clones were end-sequenced, and a physical map was constructed after high information content fingerprinting (HICF) <abbrgrp>
<abbr bid="B32">32</abbr>
<abbr bid="B33">33</abbr>
</abbrgrp>. A total of 32,719 fingerprinted BACs was assembled into 3,106 contigs and 1,356 singletons using the program FPC version 7.2 <abbrgrp>
<abbr bid="B34">34</abbr>
</abbrgrp>.</p>
<p>The quality of the physical map was assessed by screening the arrayed library with probes developed for <it>Amborella </it>homologs for eight genes that have been found to be single-copy in sequenced plant genomes <abbrgrp>
<abbr bid="B35">35</abbr>
<abbr bid="B36">36</abbr>
</abbrgrp>. Probes derived from <it>Amborella </it>cDNA clones or PCR amplicons were putative homologs of following single-copy <it>Arabidopsis </it>genes: <it>ASD </it>(At1g14810), <it>DWARF1 </it>(At3g19820), <it>GIGANTEA </it>(At1g22770), <it>LEAFY </it>(At5g61850), a dienelactone hydrolase gene (At2g32520), a cytochrome-C-oxidase-related gene (At4g37830), <it>EIF3K </it>(At4g33250) and a hypothetical protein-coding gene with strong similarity to rice gene Os02g0593400 (At5g63135). All verified positive clones mapped to the same FPC contig for six of the eight probes (Figure S1 in Additional file <supplr sid="S1">1</supplr>). Positive clones for the <it>EIF3K </it>and the hypothetical protein-coding gene probes were each distributed between two FPC contigs and inspection of the HICF bands for these contigs suggests that the genes have been duplicated in the <it>Amborella </it>lineage. In accordance with the expected library coverage, the single copy nuclear gene probes hybridized to 3 to 13 clones (mean 6.9).</p>
<suppl id="S1">
<title>
<p>Additional file 1</p>
</title>
<text>
<p>
<b>Supplemental tables and figures cited with additional details for the physical map and shotgun sequences</b>.</p>
</text>
<file name="gb-2011-12-5-r48-S1.DOC">
   <p>Click here for file</p>
</file>
</suppl>
<p>The correlation between HICF bands and the number of BACs included in each FPC contig was 0.655 for all contigs and 0.917 after removing two contigs derived from the chloroplast and mitochondrial genomes and one contig composed largely of repetitive elements (Figure S2 in Additional file <supplr sid="S1">1</supplr>). We used a calibration of average insert size (123 kb) over the average number of HICF bands per BAC clone (128) to obtain a rough estimate of FPC contig lengths. Of 77 FPC contigs with 39 or more BACs (not including the contigs with the plastome and repetitive elements), estimated lengths ranged from 308 to 1,429 kb.</p>
<p>BAC end sequencing was performed on all fingerprinted BACs producing 69,466 Sanger reads with an average length of 695 bp after quality and vector trimming. This corresponds to 48.25 Mbp, or roughly 5.4% of the <it>Amborella </it>genome. BESs were related to the physical map and used to identify regions of synteny between regions of the <it>Amborella </it>genome and the sequenced <it>Arabidopsis</it>, <it>Populus</it>, <it>Vitis </it>(grape), and <it>Oryza </it>(rice) genomes (see below). In addition, end sequences were used to verify the identity of the three excluded FPC contigs described above. All BESs mapping at least 100 bp apart on the plastid genome <abbrgrp>
<abbr bid="B37">37</abbr>
</abbrgrp> were found in the same FPC contig. This contig included just 532 BACs, indicating very low (1.6%) plastid DNA contamination.</p>
</sec>
<sec>
<st>
<p>Characterization of repeats in BAC end and shotgun sequences</p>
</st>
<p>Repeat composition and frequency in the <it>Amborella </it>genome were characterized through analysis of the BAC end and whole genome survey sequences. Reads were first compared with sequences in Repbase (v.15.08) <abbrgrp>
<abbr bid="B38">38</abbr>
</abbrgrp> using BLASTN <abbrgrp>
<abbr bid="B39">39</abbr>
</abbrgrp>. In order to minimize the effect of divergence between <it>Amborella </it>genes and homologous repeats from other species, we used relaxed BLASTN settings (-q -4 -r 5) to accommodate an estimated 160 million years of sequence divergence since the last common ancestor of extant flowering plants <abbrgrp>
<abbr bid="B8">8</abbr>
<abbr bid="B40">40</abbr>
<abbr bid="B41">41</abbr>
<abbr bid="B42">42</abbr>
</abbrgrp> while maintaining rigorous support for significant hits (E-value threshold was set at 1e-10). All BAC end sequences without significant hits were then compared with the non-redundant protein database in GenBank using BLASTX and an E-value threshold of e-5. Finally, the remaining sequences without matches in Repbase or the GenBank nr database were compared with sequences that did have matches in either database using BLASTN with an E-value threshold of 1.0e-10. We report results both excluding these 'internal' BLAST searches and including them (I). Together these results provide estimates of transposable element (TE) content based on conservative and more comprehensive (and possibly more permissive; I) search strategies.</p>
<p>With the more comprehensive strategy (I), slightly more than half of all the <it>Amborella </it>BESs matched known TE sequences. Not surprisingly, the most highly represented TE class was long terminal repeat (LTR) retrotransposons, accounting for 7.65% (I: 30.01%) of all BESs and 57.5% (I: 56.58%) of all those with hits to Repbase. Hits to Ty1-<it>copia </it>type sequences were slightly more common (3.11%; I: 13.79%) than matches to Ty3-<it>gypsy</it>-like LTRs (3.50%; I: 12.09%); the remaining LTR retrotransposon matches (1.04%; I: 4.13%) were not classified. LINEs also represented a significant fraction of <it>Amborella </it>BAC ends: 2.70% (I: 11.60%) of the total, 19.98% of all the repeats (I: 22.22%). This is noteworthy because LINEs are usually significantly less numerous than LTR retrotransposons in plant genomes <abbrgrp>
<abbr bid="B43">43</abbr>
<abbr bid="B44">44</abbr>
<abbr bid="B45">45</abbr>
<abbr bid="B46">46</abbr>
<abbr bid="B47">47</abbr>
</abbrgrp> with some notable exceptions, such as the element <it>del2 </it>in <it>Lilium speciosum </it>
<abbrgrp>
<abbr bid="B48">48</abbr>
</abbrgrp>. The complete set of DNA TE-related BESs accounts for just 1.63% (I: 4.51%) of the total, and the most represented classes are those of hAT and MuDR elements: 0.92% (I: 2.41%) and 0.49% (I: 1.04%) of the total BESs, respectively. Results from the same analyses replicated on the set of 2,695 random sheared Sanger sequences (Table <tblr tid="T1">1</tblr>) and 648,519 454 reads (Table S1 in Additional file <supplr sid="S1">1</supplr>) are generally in very good agreement with those obtained using BES data.</p>
<tbl id="T1"><title><p>Table 1</p></title><caption><p>Frequencies of BAC end sequences and Sanger shot gun sequences matching sequences in Repbase</p></caption><tblbdy cols="7">
      <r>
         <c ca="left">
            <p>
               <b>Type</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>Absolute number in BESs</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>Percentage BESs</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>Percentage repeats in BESs</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>Absolute number in SGSs</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>Percentage SGSs</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>Percentage repeats in SGSs</b>
            </p>
         </c>
      </r>
      <r>
         <c cspan="7">
            <hr/>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>
               <b>DNA TEs</b>
            </p>
         </c>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
      </r>
      <r>
         <c indent="1" ca="left">
            <p>hAT</p>
         </c>
         <c ca="center">
            <p>642 (1,671)</p>
         </c>
         <c ca="center">
            <p>0.92 (2.41)</p>
         </c>
         <c ca="center">
            <p>6.84 (4.61)</p>
         </c>
         <c ca="center">
            <p>20 (41)</p>
         </c>
         <c ca="center">
            <p>0.74 (1.52)</p>
         </c>
         <c ca="center">
            <p>5.73 (2.94)</p>
         </c>
      </r>
      <r>
         <c indent="1" ca="left">
            <p>MuDR</p>
         </c>
         <c ca="center">
            <p>343 (724)</p>
         </c>
         <c ca="center">
            <p>0.49 (1.04)</p>
         </c>
         <c ca="center">
            <p>3.65 (2.00)</p>
         </c>
         <c ca="center">
            <p>7 (30)</p>
         </c>
         <c ca="center">
            <p>0.26 (1.11)</p>
         </c>
         <c ca="center">
            <p>2.00 (2.15)</p>
         </c>
      </r>
      <r>
         <c indent="1" ca="left">
            <p>CACTA</p>
         </c>
         <c ca="center">
            <p>27 (75)</p>
         </c>
         <c ca="center">
            <p>0.04 (0.11)</p>
         </c>
         <c ca="center">
            <p>0.29 (0.21)</p>
         </c>
         <c ca="center">
            <p>0 (4)</p>
         </c>
         <c ca="center">
            <p>0 (0.15)</p>
         </c>
         <c ca="center">
            <p>0 (0.29)</p>
         </c>
      </r>
      <r>
         <c indent="1" ca="left">
            <p>Helitrons</p>
         </c>
         <c ca="center">
            <p>12 (69)</p>
         </c>
         <c ca="center">
            <p>0.02 (0.10)</p>
         </c>
         <c ca="center">
            <p>0.13 (0.19)</p>
         </c>
         <c ca="center">
            <p>0 (3)</p>
         </c>
         <c ca="center">
            <p>0 (0.11)</p>
         </c>
         <c ca="center">
            <p>0 (0.22)</p>
         </c>
      </r>
      <r>
         <c indent="1" ca="left">
            <p>Other</p>
         </c>
         <c ca="center">
            <p>108 (595)</p>
         </c>
         <c ca="center">
            <p>0.15 (0.86)</p>
         </c>
         <c ca="center">
            <p>1.15 (1.64)</p>
         </c>
         <c ca="center">
            <p>1 (24)</p>
         </c>
         <c ca="center">
            <p>0.04 (0.89)</p>
         </c>
         <c ca="center">
            <p>0.29 (1.72)</p>
         </c>
      </r>
      <r>
         <c indent="1" ca="left">
            <p>Total</p>
         </c>
         <c ca="center">
            <p>1,132 (3,134)</p>
         </c>
         <c ca="center">
            <p>1.63 (4.51)</p>
         </c>
         <c ca="center">
            <p>12.06 (8.64)</p>
         </c>
         <c ca="center">
            <p>28 (102)</p>
         </c>
         <c ca="center">
            <p>1.04 (3.78)</p>
         </c>
         <c ca="center">
            <p>8.02 (7.31)</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>
               <b>Retrotransposons</b>
            </p>
         </c>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
      </r>
      <r>
         <c indent="1" ca="left">
            <p>LTR Ty1-<it>copia</it></p>
         </c>
         <c ca="center">
            <p>2,162 (9,578)</p>
         </c>
         <c ca="center">
            <p>3.11 (13.79)</p>
         </c>
         <c ca="center">
            <p>23.02 (26.42)</p>
         </c>
         <c ca="center">
            <p>64 (314)</p>
         </c>
         <c ca="center">
            <p>2.37 (11.65)</p>
         </c>
         <c ca="center">
            <p>18.34 (22.51)</p>
         </c>
      </r>
      <r>
         <c indent="1" ca="left">
            <p>LTR Ty3-<it>gypsy</it></p>
         </c>
         <c ca="center">
            <p>2,431 (8,395)</p>
         </c>
         <c ca="center">
            <p>3.50 (12.09)</p>
         </c>
         <c ca="center">
            <p>25.89 (23.15)</p>
         </c>
         <c ca="center">
            <p>129 (377)</p>
         </c>
         <c ca="center">
            <p>4.78 (13.98)</p>
         </c>
         <c ca="center">
            <p>36.96 (27.03)</p>
         </c>
      </r>
      <r>
         <c indent="1" ca="left">
            <p>LTR not classified</p>
         </c>
         <c ca="center">
            <p>720 (2,868)</p>
         </c>
         <c ca="center">
            <p>1.04 (4.13)</p>
         </c>
         <c ca="center">
            <p>7.67 (7.91)</p>
         </c>
         <c ca="center">
            <p>51 (139)</p>
         </c>
         <c ca="center">
            <p>1.89 (5.16)</p>
         </c>
         <c ca="center">
            <p>14.61 (0.96)</p>
         </c>
      </r>
      <r>
         <c indent="1" ca="left">
            <p>LINEs</p>
         </c>
         <c ca="center">
            <p>1,876 (8,055)</p>
         </c>
         <c ca="center">
            <p>2.70 (11.60)</p>
         </c>
         <c ca="center">
            <p>19.98 (22.22)</p>
         </c>
         <c ca="center">
            <p>55 (294)</p>
         </c>
         <c ca="center">
            <p>2.04 (10.91)</p>
         </c>
         <c ca="center">
            <p>15.76 (21.08)</p>
         </c>
      </r>
      <r>
         <c indent="1" ca="left">
            <p>SINEs</p>
         </c>
         <c ca="center">
            <p>11 (183)</p>
         </c>
         <c ca="center">
            <p>0.02 (0.26)</p>
         </c>
         <c ca="center">
            <p>0.12 (0.50)</p>
         </c>
         <c ca="center">
            <p>0 (4)</p>
         </c>
         <c ca="center">
            <p>0 (0.15)</p>
         </c>
         <c ca="center">
            <p>0 (0.29)</p>
         </c>
      </r>
      <r>
         <c indent="1" ca="left">
            <p>Retro not classified</p>
         </c>
         <c ca="center">
            <p>1,058 (4,046)</p>
         </c>
         <c ca="center">
            <p>1.52 (5.82)</p>
         </c>
         <c ca="center">
            <p>11.27 (11.16)</p>
         </c>
         <c ca="center">
            <p>23 (165)</p>
         </c>
         <c ca="center">
            <p>0.85 (6.12)</p>
         </c>
         <c ca="center">
            <p>6.59 (11.83)</p>
         </c>
      </r>
      <r>
         <c indent="1" ca="left">
            <p>Total</p>
         </c>
         <c ca="center">
            <p>8,258 (33,125)</p>
         </c>
         <c ca="center">
            <p>11.89 (47.69)</p>
         </c>
         <c ca="center">
            <p>87.94 (91.36)</p>
         </c>
         <c ca="center">
            <p>321 (1,293)</p>
         </c>
         <c ca="center">
            <p>11.91 (47.96)</p>
         </c>
         <c ca="center">
            <p>91.98 (92.69)</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>
               <b>Total</b>
            </p>
         </c>
         <c ca="center">
            <p>9,390 (36,259)</p>
         </c>
         <c ca="center">
            <p>13.52 (52.20)</p>
         </c>
         <c ca="center">
            <p>100 (100)</p>
         </c>
         <c ca="center">
            <p>349 (1,395)</p>
         </c>
         <c ca="center">
            <p>12.95 (51.74)</p>
         </c>
         <c ca="center">
            <p>100 (100)</p>
         </c>
      </r>
   </tblbdy><tblfn>
      <p>Results in parentheses include Internal BlastN searches. Repbase v.15.08 was used <abbrgrp><abbr bid="B38">38</abbr></abbrgrp>. SINE, short interspersed element; SGS, Sanger shot gun sequence.</p>
   </tblfn></tbl>
<p>A <it>de novo </it>search for novel miniature inverted repeat transposable elements (MITEs) overlooked by the similarity search approach was carried out using the pipeline MUST <abbrgrp>
<abbr bid="B49">49</abbr>
</abbrgrp>. The most abundant candidates identified by the pipeline were manually inspected to confirm features typical of MITEs, such as small size, terminal inverted repeats, high A+T nucleotide content and target site duplications. Three putative high-copy MITEs were identified. All of these were small elements (174 to 500 bp) with terminal inverted repeats, target site duplications, and A+T content greater than 65% (Figure S3 in Additional file <supplr sid="S1">1</supplr>). Repeat copy numbers estimated from the BESs and random sheared sequences were extrapolated to obtain genome-wide estimates using the procedure developed by Hawkins <it>et al</it>. <abbrgrp>
<abbr bid="B50">50</abbr>
</abbrgrp>. Copy number ranges from 3,300 copies for MITE_2 to 17,000 copies for MITE_1. The estimates inferred from BESs were generally consistent with those calculated for random sheared reads (with the possible exception of MITE_3; Table <tblr tid="T2">2</tblr>).</p>
<tbl id="T2"><title><p>Table 2</p></title><caption><p>Putatively high-copy MITEs identified in the BESs and Sanger shot gun sequences using MUST pipeline</p></caption><tblbdy cols="8">
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>
               <b>Length</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>Inverted repeat length</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>BES hits</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>Copy number estimate</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>SGS hits</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>Copy number estimate</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>AT%</b>
            </p>
         </c>
      </r>
      <r>
         <c cspan="8">
            <hr/>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>MITE_1</p>
         </c>
         <c ca="center">
            <p>358</p>
         </c>
         <c ca="center">
            <p>26</p>
         </c>
         <c ca="center">
            <p>542</p>
         </c>
         <c ca="center">
            <p>~17,000</p>
         </c>
         <c ca="center">
            <p>18</p>
         </c>
         <c ca="center">
            <p>~17,200</p>
         </c>
         <c ca="center">
            <p>68.80</p>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>MITE_2</p>
         </c>
         <c ca="center">
            <p>190</p>
         </c>
         <c ca="center">
            <p>19</p>
         </c>
         <c ca="center">
            <p>140</p>
         </c>
         <c ca="center">
            <p>~3,300</p>
         </c>
         <c ca="center">
            <p>8</p>
         </c>
         <c ca="center">
            <p>~3,100</p>
         </c>
         <c ca="center">
            <p>68.70</p>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>MITE_3</p>
         </c>
         <c ca="center">
            <p>516</p>
         </c>
         <c ca="center">
            <p>47</p>
         </c>
         <c ca="center">
            <p>394</p>
         </c>
         <c ca="center">
            <p>~17,900</p>
         </c>
         <c ca="center">
            <p>8</p>
         </c>
         <c ca="center">
            <p>~11,300</p>
         </c>
         <c ca="center">
            <p>75.20</p>
         </c>
      </r>
   </tblbdy><tblfn>
      <p>Copy number estimates based on procedure of Hawkins <it>et al</it>. <abbrgrp><abbr bid="B50">50</abbr></abbrgrp>. SGS, Sanger shot gun sequence.</p>
   </tblfn></tbl>
<p>The conserved reverse transcriptase domains of LTR retrotransposons and LINEs were collected and used to estimate maximum likelihood trees (Figure <figr fid="F1">1</figr>). In the case of LTR retroelements, the trees indicate substitution rate heterogeneity (that is, variation in root-to-tip distances) and no evidence for recent retrotranspositional bursts of single families (that is, short terminal branches). In the case of LINEs, the phylogenetic tree displays very long branches suggestive of an ancient diversification or very rapid substitution rates. As has been described for other plants <abbrgrp>
<abbr bid="B51">51</abbr>
</abbrgrp>, <it>Amborella </it>LINEs exhibit high sequence divergence and extreme heterogeneity.</p>
<fig id="F1"><title><p>Figure 1</p></title><caption><p>Maximum likelihood trees for reverse transcriptase genes classified as Copia-type and Gypsy-type LTR and LINE elements</p></caption><text>
   <p><b>Maximum likelihood trees for reverse transcriptase genes classified as Copia-type and Gypsy-type LTR and LINE elements</b>. <b>(a) </b>Copia-type; <b>(b) </b>Gypsy-type LTRs; <b>(c) </b>Gypsy-type LINEs. The maximum likelihood trees show rate heterogeneity and no recent expansive radiations (that is, short terminal branches). Reverse transcriptase sequences were mined from BAC end sequence set.</p>
</text><graphic file="gb-2011-12-5-r48-1"/></fig>
<p>The <it>Amborella </it>BESs were also searched for microsatellites (that is, simple sequence repeats (SSRs)); for comparison, the search was also conducted on the <it>Amborella </it>random sheared reads and on BESs (from other <it>Hin</it>dIII BAC libraries) from <it>Glycine </it>(soybean) and <it>Oryza rufipogon</it>. In comparison to the other two species, <it>Amborella </it>shows a higher frequency of SSRs, particularly mono- and dinucleotide repeats, with a particularly high frequency of 'AG' dinucleotide microsatellites. The results of SSR analysis in BESs were confirmed by those obtained from the randomly sheared <it>Amborella </it>sequences (Table <tblr tid="T3">3</tblr>).</p>
<tbl id="T3"><title><p>Table 3</p></title><caption><p>Simple sequence repeats identified in BESs and Sanger shot gun sequences</p></caption><tblbdy cols="5">
      <r>
         <c ca="left">
            <p>
               <b>Repeat</b>
            </p>
         </c>
         <c ca="right">
            <p>
               <b><it>Amborella </it>(BES)</b>
               <sup>
                  <b>a</b>
               </sup>
            </p>
         </c>
         <c ca="right">
            <p>
               <b><it>Amborella </it>(RS)</b>
               <sup>
                  <b>a</b>
               </sup>
            </p>
         </c>
         <c ca="right">
            <p>
               <b>SoyBean</b>
               <sup>
                  <b>a</b>
               </sup>
            </p>
         </c>
         <c ca="right">
            <p>
               <b><it>Oryza </it>rufipogon</b>
               <sup>
                  <b>a</b>
               </sup>
            </p>
         </c>
      </r>
      <r>
         <c cspan="5">
            <hr/>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Mono</p>
         </c>
         <c ca="right">
            <p>149.66</p>
         </c>
         <c ca="right">
            <p>152.89</p>
         </c>
         <c ca="right">
            <p>72.74</p>
         </c>
         <c ca="right">
            <p>50.79</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Di</p>
         </c>
         <c ca="right">
            <p>225.03</p>
         </c>
         <c ca="right">
            <p>211.00</p>
         </c>
         <c ca="right">
            <p>77.89</p>
         </c>
         <c ca="right">
            <p>63.94</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Tri</p>
         </c>
         <c ca="right">
            <p>72.49</p>
         </c>
         <c ca="right">
            <p>78.96</p>
         </c>
         <c ca="right">
            <p>110.01</p>
         </c>
         <c ca="right">
            <p>144.06</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Tetra</p>
         </c>
         <c ca="right">
            <p>89.88</p>
         </c>
         <c ca="right">
            <p>90.70</p>
         </c>
         <c ca="right">
            <p>100.67</p>
         </c>
         <c ca="right">
            <p>102.25</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Penta</p>
         </c>
         <c ca="right">
            <p>74.85</p>
         </c>
         <c ca="right">
            <p>89.73</p>
         </c>
         <c ca="right">
            <p>64.54</p>
         </c>
         <c ca="right">
            <p>56.00</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Total</p>
         </c>
         <c ca="right">
            <p>611.92</p>
         </c>
         <c ca="right">
            <p>623.28</p>
         </c>
         <c ca="right">
            <p>425.85</p>
         </c>
         <c ca="right">
            <p>417.04</p>
         </c>
      </r>
   </tblbdy><tblfn>
      <p><sup>a</sup>Values are presence per million base pairs. RS, Random sheared</p>
   </tblfn></tbl>
<p>Repeat profiles in the shotgun sequences were also assessed using Tallymer to characterize K-mer frequencies <abbrgrp>
<abbr bid="B52">52</abbr>
</abbrgrp>. The <it>Amborella </it>K-mer frequency profiles were compared with those of <it>Arabidopsis thaliana</it>, <it>Oryza sativa </it>(rice), <it>Sorghum bicolor </it>and <it>Zea mays </it>(maize). While the <it>Amborella </it>genome size is closest to Sorghum's (870 and 740 Mbp/C, respectively), its K-mer frequency profiles were more similar to those of <it>Arabidopsis </it>and rice, with much smaller genome sizes (157 and 490 Mbp/1C, respectively <abbrgrp>
<abbr bid="B53">53</abbr>
</abbrgrp>) (Figure <figr fid="F2">2</figr>).</p>
<fig id="F2"><title><p>Figure 2</p></title><caption><p>K-mer analyses of Sanger shotgun sequences reveal low frequencies of short repeats in the <it>Amborella </it>genome relative to the sorghum and maize genomes</p></caption><text>
   <p><b>K-mer analyses of Sanger shotgun sequences reveal low frequencies of short repeats in the <it>Amborella </it>genome relative to the sorghum and maize genomes</b>.</p>
</text><graphic file="gb-2011-12-5-r48-2"/></fig>
</sec>
<sec>
<st>
<p>Distribution of BESs with matches to protein-coding regions of reference genomes</p>
</st>
<p>All BESs and shotgun sequences were compared to the GenBank nr database using BLASTX <abbrgrp>
<abbr bid="B39">39</abbr>
</abbrgrp> with an e-value threshold of 1e-5. After the removal of sequences similar to TEs, the overall frequencies of sequences finding matches in the protein database were 11.9% and 8.05% for the BES and Sanger shotgun sequences, respectively. For BESs from FPC contigs with ten or more BACs, we found a negative correlation between the frequencies of BESs matching protein-coding genes and LTR retrotransposons (r = -0.423, <it>P </it>&lt; 0.0001). As has been described for other genomes <abbrgrp>
<abbr bid="B54">54</abbr>
<abbr bid="B55">55</abbr>
<abbr bid="B56">56</abbr>
</abbrgrp>, gene density seems to be negatively correlated with retrotranposon density in the <it>Amborella </it>genome.</p>
</sec>
<sec>
<st>
<p>Identification of syntenic blocks between <it>Amborella</it>, <it>Arabidopsis</it>, rice, poplar and grape</p>
</st>
<p>Taking advantage of the availability of a phase I physical map assembly, we mapped the <it>Amborella </it>contigs onto the genomes of <it>A. thaliana</it>, <it>Populus trichocarpa</it>, <it>Vitis vinifera</it>, and <it>O. sativa</it>. We focused on the 77 largest contigs with at least 39 clones. BLAST analyses of BESs were done within the context of their linkages within FPC contigs. All of the contig BESs classified as repeats (see above) were discarded. Those remaining were compared against the four reference genomes. Because of the large evolutionary time that separates <it>Amborella </it>from the other four sequenced genomes <abbrgrp>
<abbr bid="B41">41</abbr>
<abbr bid="B42">42</abbr>
<abbr bid="B57">57</abbr>
</abbrgrp>, the comparisons were carried out at the protein level using tBLASTX; only the best hits were taken into account. <it>Amborella </it>FPC contigs were considered for further analyses if at least two BESs had matches with bit scores greater than 80 (typically a maximum e-value of 1.0E-20 over 100 amino acidic residues) to loci separated by less than 500 kb within one of the four genomes being compared. Positive matches were used as anchors to circumscribe 4-Mbp tracts within the reference genomes and a second, more focused tBLASTX search was performed comparing the BESs with these regions. An e-value threshold of 1.0E-4 was used for the second set of tBLASTX searches and all significant hits were used to identify syntenic regions. We considered a contig as anchored if the contig had at least four positive hits (e-value lower than 1.0e-4) to at least three distinct genes.</p>
<p>Non-repetitive BESs were also compared to a database of 246,196 <it>Amborella </it>cDNA unigene assemblies with lengths greater than 100 bp. These cDNAs were derived from comprehensive sequencing of nine cDNA libraries (Table <tblr tid="T4">4</tblr>) <abbrgrp>
<abbr bid="B25">25</abbr>
</abbrgrp>. Sixty-six percent of the non-repetitive BESs matched cDNA sequences in BLASTN searches with an e-value cutoff of 1.0e-10.</p>
<tbl id="T4"><title><p>Table 4</p></title><caption><p>Statistics for cDNA sequences included in multi-library transcriptome assembly of 246,196 unigenes with lengths greater than 100 bp</p></caption><tblbdy cols="5">
      <r>
         <c ca="left">
            <p>
               <b>Tissue - library name</b>
            </p>
         </c>
         <c ca="left">
            <p>
               <b>Sequencing method</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>Number of reads</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>Unscreened reads</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>Total passing bases (MB)</b>
            </p>
         </c>
      </r>
      <r>
         <c cspan="5">
            <hr/>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Apical meristem - Atr12</p>
         </c>
         <c ca="left">
            <p>454 FLX Titanium</p>
         </c>
         <c ca="center">
            <p>794,746</p>
         </c>
         <c ca="center">
            <p>688,305</p>
         </c>
         <c ca="center">
            <p>201.90</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Male flowers - Atr15</p>
         </c>
         <c ca="left">
            <p>454 FLX Titanium</p>
         </c>
         <c ca="center">
            <p>277,023</p>
         </c>
         <c ca="center">
            <p>255,213</p>
         </c>
         <c ca="center">
            <p>73.49</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Old leaves - Atr14</p>
         </c>
         <c ca="left">
            <p>454 FLX Titanium</p>
         </c>
         <c ca="center">
            <p>280,097</p>
         </c>
         <c ca="center">
            <p>260,563</p>
         </c>
         <c ca="center">
            <p>73.49</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Old stem - Atr13</p>
         </c>
         <c ca="left">
            <p>454 FLX Titanium</p>
         </c>
         <c ca="center">
            <p>259,431</p>
         </c>
         <c ca="center">
            <p>238,156</p>
         </c>
         <c ca="center">
            <p>68.70</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Pre-meiotic female flower buds - Atr10</p>
         </c>
         <c ca="left">
            <p>454 FLX GS</p>
         </c>
         <c ca="center">
            <p>895,000</p>
         </c>
         <c ca="center">
            <p>812,325</p>
         </c>
         <c ca="center">
            <p>176.97</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Pre-meiotic female flower bud - Atr02</p>
         </c>
         <c ca="left">
            <p>Sanger</p>
         </c>
         <c ca="center">
            <p>13,263</p>
         </c>
         <c ca="center">
            <p>13,141</p>
         </c>
         <c ca="center">
            <p>7.17</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Pre-meiotic male flower bud - Atr01</p>
         </c>
         <c ca="left">
            <p>Sanger</p>
         </c>
         <c ca="center">
            <p>25,343</p>
         </c>
         <c ca="center">
            <p>25,006</p>
         </c>
         <c ca="center">
            <p>14.17</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Root - Atr11</p>
         </c>
         <c ca="left">
            <p>454 FLX GS</p>
         </c>
         <c ca="center">
            <p>324,070</p>
         </c>
         <c ca="center">
            <p>300,275</p>
         </c>
         <c ca="center">
            <p>64.88</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Stem - Atr16</p>
         </c>
         <c ca="left">
            <p>454 FLX Titanium</p>
         </c>
         <c ca="center">
            <p>410,098</p>
         </c>
         <c ca="center">
            <p>388,436</p>
         </c>
         <c ca="center">
            <p>120.03</p>
         </c>
      </r>
   </tblbdy><tblfn>
      <p>Assemblies and raw data can be downloaded from the Ancestral Angiosperm Genome Project website <abbrgrp><abbr bid="B25">25</abbr></abbrgrp>. A BLAST portal for the assembly is also available at the project website.</p>
   </tblfn></tbl>
<p>Using the search strategy described above, 29 large <it>Amborella </it>BAC contigs (&gt;39 BAC clones) showed synteny with at least one of the four sequenced genomes, and nine of these showed synteny with at least one region in all four genomes. All BESs mapping to these syntenic regions also exhibited significant matches to the sequences in the <it>Amborella </it>cDNA assembly (Table <tblr tid="T4">4</tblr>; Table S2 in Additional file <supplr sid="S1">1</supplr>). Whereas 25 of these <it>Amborella </it>BAC contigs mapped to at least one tract in the <it>Vitis </it>genome, 15, 16, and 24 contigs were found to be syntenic with one or more tracts in the <it>Oryza</it>, <it>Arabidopsis</it>, and <it>Populus </it>genomes, respectively (Table S2 in Additional file <supplr sid="S1">1</supplr>). These results provide a novel, albeit coarse, first view of the ancestral genome for all flowering plants and the timing of rearrangements and other structural changes (for example, genome duplications, fractionation, chromosomal fissions and fusions) that have reduced synteny between the monocot and eudicot genomes analyzed here (Figure <figr fid="F3">3</figr>). Parsimony mapping of synteny loss onto a phylogeny consisting of <it>Amborella </it>and the other four species indicates variation in rates of change in genome structure. In agreement with previous studies <abbrgrp>
<abbr bid="B29">29</abbr>
<abbr bid="B45">45</abbr>
</abbrgrp>, <it>Vitis </it>seems to have been the most stable of the sequenced genomes, and the rate of change slowed in the lineage leading to <it>Populus </it>following divergence from the lineage leading to <it>Arabidopsis </it>(Figure <figr fid="F3">3</figr>).</p>
<fig id="F3"><title><p>Figure 3</p></title><caption><p>Variation in rates of structural evolution evident in parsimony mapping of losses of synteny with 29 gene blocks inferred for the last common ancestor of all extant flowering plant lineages</p></caption><text>
   <p><b>Variation in rates of structural evolution evident in parsimony mapping of losses of synteny with 29 gene blocks inferred for the last common ancestor of all extant flowering plant lineages</b>.</p>
</text><graphic file="gb-2011-12-5-r48-3"/></fig>
</sec>
<sec>
<st>
<p>Paleopolyploidy in angiosperm genomes</p>
</st>
<p>Paleopolyploidy events have been well characterized in all four sequenced genomes analyzed here <abbrgrp>
<abbr bid="B29">29</abbr>
<abbr bid="B45">45</abbr>
<abbr bid="B58">58</abbr>
<abbr bid="B59">59</abbr>
<abbr bid="B60">60</abbr>
</abbrgrp>, and the syntenic <it>Amborella </it>FPC contigs described above often match multiple regions in these genomes. The most ancient of these paleopolyploidy events is the so-called &#947; triplication that has been inferred to have occurred before the divergence of the Asteridae (represented by tomato, <it>Solanum lycopersicon</it>) and the Rosidae, including <it>Vitis</it>, <it>Populus </it>and <it>Arabidopsis </it>
<abbrgrp>
<abbr bid="B29">29</abbr>
</abbrgrp>. Given the very incomplete view of the <it>Amborella </it>genome that is available in the BES data, we are not able to assess synteny between <it>Amborella </it>FPC contigs. Nevertheless, comparisons between the <it>Amborella </it>contigs and sets of syntenic blocks in the <it>Vitis </it>genome indicate that the &#947; triplication most likely occurred sometime after the divergence of all other angiosperms from the lineage leading to <it>Amborella</it>.</p>
<p>All BESs were compared to all annotated protein-coding genes in the <it>Vitis </it>genome placed within the context of the pre-triplication ancestral gene blocks and post-triplication syntenic segments identified by Tang <it>et al</it>. <abbrgrp>
<abbr bid="B29">29</abbr>
</abbrgrp>. A total of 328 <it>Amborella </it>FPC contigs had between two and eight genes with significant best BLASTX matches (e-values &#8804;1.0E-6) to <it>Vitis </it>genes corresponding to pre-triplication gene blocks in the ancestral genome. In most of these cases (199 of 328; Additional file <supplr sid="S2">2</supplr>), best hits were distributed between two or three homeologous (that is, post-triplication) syntenic <it>Vitis </it>genome segments. Of the remaining 129 <it>Amborella </it>FPC contigs with BESs showing significant BLASTX hits to a single <it>Vitis </it>subgenome (that is, single copy of a triplicated ancestral block), most (113) included just 2 genes mapping to the ancestral <it>Vitis </it>gene blocks (14 including 3 genes, and 2 including 4 genes) (Additional file <supplr sid="S2">2</supplr>). All 21 FPC contigs with best BLASTX matches to five or more genes within the ancestral <it>Vitis </it>blocks were distributed among two or three post-triplication subgenomes. Complete sequences for the <it>Amborella </it>BAC contigs may reveal more even distribution of segments among <it>Vitis </it>subgenomes, but the results described here suggest that triplication, fractionation and divergence of homeologous segments in the <it>Vitis </it>genome postdate the divergence between lineages leading to <it>Vitis </it>and <it>Amborella </it>(that is, the last common ancestor of all extant angiosperms).</p>
<suppl id="S2">
<title>
<p>Additional file 2</p>
</title>
<text>
<p>
<b>Synteny analysis of <it>Amborella </it>BAC ends and <it>Vitis </it>genes</b>.</p>
</text>
<file name="gb-2011-12-5-r48-S2.XLS">
   <p>Click here for file</p>
</file>
</suppl>
</sec>
<sec>
<st>
<p>Analysis of complete sequences for two <it>Amborella </it>BAC contigs</p>
</st>
<p>Two of the larger (approximately 500 kb) BAC contigs (IDs 431 and 1003) mapping to multiple segments in all four sequenced reference genomes were identified for further investigation. A minimum tiling path was constructed for each contig, and florescence <it>in situ </it>hybridizations were performed to verify that the BACs mapped to a single contiguous region in the <it>Amborella </it>genome (Figure <figr fid="F4">4</figr>). Each BAC in the tiling paths was subcloned and sequenced to 8 &#215; coverage on an ABI 3730xl sequencer. Gaps were closed for each scaffold, and contiguous 487,318 and 629,678 bp phase II sequences were assembled for contigs 431 and 1003, respectively.</p>
<fig id="F4"><title><p>Figure 4</p></title><caption><p>Hybridization of three BAC clones in the minimum tiling paths for contigs 1003 and 431 to mitotic squashes (2<it>n </it>= 26) verifies the FPC assemblies</p></caption><text>
   <p><b>Hybridization of three BAC clones in the minimum tiling paths for contigs 1003 and 431 to mitotic squashes (2<it>n </it>= 26) verifies the FPC assemblies. (a-e) </b>Results for contig 1003; <b>(f-j) </b>results for contig 431. Panels (a) and (f) show all three BAC-FISH probes merged; (e,j) DAPI staining; (b,c,d) show each of three BACs (red, green, white) for contig 1003; (g,h,i) show each of three BACs (red, green, white) for contig 431.</p>
</text><graphic file="gb-2011-12-5-r48-4"/></fig>
<p>The DAWGPAWS suite of scripts was used to organize <it>ab initio </it>gene predictions, BLAST results and the output of repeat identification tools <abbrgrp>
<abbr bid="B61">61</abbr>
<abbr bid="B62">62</abbr>
</abbrgrp>. <it>Ab initio </it>gene predictions were generated using FGENESH <abbrgrp>
<abbr bid="B63">63</abbr>
</abbrgrp>, AUGUSTUS <abbrgrp>
<abbr bid="B64">64</abbr>
</abbrgrp>, SNAP <abbrgrp>
<abbr bid="B65">65</abbr>
</abbrgrp>, GeneID <abbrgrp>
<abbr bid="B66">66</abbr>
</abbrgrp> and GenScan <abbrgrp>
<abbr bid="B67">67</abbr>
</abbrgrp>. In addition, <it>Amborella </it>EST sequences produced by the 454 Titanium platform (2,943,273 reads; total read size of approximately 776 Mbp; average read length of 263.60 bp) and Sanger sequencing (38,147 reads; total read size of approximately 21.3 Mbp; average read length of 559.57 bp) were splice-aligned to the contigs using GMAP (Genomic Mapping and Alignment Program) <abbrgrp>
<abbr bid="B68">68</abbr>
</abbrgrp> with the PASA (Program to Assemble Spliced Alignments) genome annotation tool <abbrgrp>
<abbr bid="B69">69</abbr>
</abbrgrp>. All predictions were manually compared with BLASTX results against gene annotations from <it>Arabidopsis </it>
<abbrgrp>
<abbr bid="B70">70</abbr>
</abbrgrp>, <it>Vitis </it>
<abbrgrp>
<abbr bid="B45">45</abbr>
</abbrgrp>, <it>Z. mays </it>
<abbrgrp>
<abbr bid="B56">56</abbr>
</abbrgrp>, <it>Medicago </it>
<abbrgrp>
<abbr bid="B71">71</abbr>
</abbrgrp>, <it>Oryza </it>
<abbrgrp>
<abbr bid="B72">72</abbr>
<abbr bid="B73">73</abbr>
</abbrgrp>, and <it>Sorghum </it>
<abbrgrp>
<abbr bid="B55">55</abbr>
</abbrgrp> as well as tBLASTx results against the <it>Amborella </it>transcript assemblies. GBrowse views of gene annotations and BLAST results for each contig are available at the Ancestral Angiosperm Genome Project website <abbrgrp>
<abbr bid="B25">25</abbr>
</abbrgrp>.</p>
<p>Rigorous assessments of synteny between these <it>Amborella </it>contigs and the aforementioned four angiosperm genomes were performed using LASTZ <abbrgrp>
<abbr bid="B74">74</abbr>
<abbr bid="B75">75</abbr>
</abbrgrp>. Dotplots comparing the <it>Amborella </it>contigs and the <it>Vitis </it>genome show that contigs are syntenic with previously triplicated blocks <abbrgrp>
<abbr bid="B29">29</abbr>
</abbrgrp>. Regions of contig 1003 match genes on syntenic segments of chromosomes 1, 14 and 17 in the <it>Vitis </it>genome (Figure <figr fid="F5">5</figr>) and contig 431 mapped to syntenic portions of <it>Vitis </it>chromosomes 6, 8 and 13 (Figure <figr fid="F6">6</figr>). These findings support the conclusion from the BES analyses suggesting that the &#947; triplication occurred after the first branching event in the phylogeny of extant angiosperms.</p>
<fig id="F5"><title><p>Figure 5</p></title><caption><p>LASTZ dot plots comparing BAC contig 1003 syntenic regions in the grape and rice genomes</p></caption><text>
   <p><b>LASTZ dot plots comparing BAC contig 1003 syntenic regions in the grape and rice genomes</b>. <b>(a) </b>Grape genome; <b>(b) </b>rice genome.</p>
</text><graphic file="gb-2011-12-5-r48-5"/></fig>
<fig id="F6"><title><p>Figure 6</p></title><caption><p>LASTZ dot plots comparing BAC contig 431 syntenic regions in the grape and rice genomes</p></caption><text>
   <p><b>LASTZ dot plots comparing BAC contig 431 syntenic regions in the grape and rice genomes</b>. <b>(a) </b>Grape genome; <b>(b) </b>rice genome.</p>
</text><graphic file="gb-2011-12-5-r48-6"/></fig>
<p>At least two genome duplications (&#961; and &#963;) have been inferred to have occurred within the monocot lineage leading to rice since divergence of monocots and eudicots <abbrgrp>
<abbr bid="B28">28</abbr>
</abbrgrp>. These duplications were evident in comparisons with both <it>Amborella </it>contigs. Regions of contig 1003 were found to be syntenic with portions of rice chromosomes 2 and 4 derived from the &#961; duplication and a portion of chromosome 10 (Figure <figr fid="F5">5</figr>) that is related to these two regions through the earlier &#963; duplication <abbrgrp>
<abbr bid="B28">28</abbr>
</abbrgrp>. The LASTZ analysis of contig 431 revealed synteny with seven regions in the rice genome (Figure <figr fid="F6">6</figr>) and one of the 'putative ancestral regions' (PAR 17) characterized by Tang <it>et al</it>. <abbrgrp>
<abbr bid="B28">28</abbr>
</abbrgrp>. These PARs were defined as regions of synteny between the rice and <it>Vitis </it>genomes. Phylogenetic analyses of genes in <it>Amborella </it>contig 431 and syntenic regions of the rice and <it>Vitis </it>genomes may elucidate the timing of the &#947; triplication and genome duplications evident in synteny analyses of the rice genome relative to the divergence of monocots and eudicots.</p>
</sec>
<sec>
<st>
<p>Phylogenetic analyses of gene families represented in sequenced <it>Amborella </it>contigs</p>
</st>
<p>While the fractionation process has resulted in the loss of most duplicated genes following the ancient polyploidy events evident in the syntenic <it>Vitis </it>and rice segments shown in Figures <figr fid="F5">5</figr> and <figr fid="F6">6</figr>, duplicate <it>Vitis </it>genes have been retained for homologs of three <it>Amborella </it>genes located on contig 431 (Figures <figr fid="F6">6a</figr>). These genes were used to search the PlantTribes gene family database <abbrgrp>
<abbr bid="B35">35</abbr>
</abbrgrp>. The three gene sets identified in the synteny analysis correspond to three gene families (auxin-independent growth promoter, ceramidase and plant uncoupling mitochondrial protein) circumscribed through OrthoMCL clustering <abbrgrp>
<abbr bid="B76">76</abbr>
</abbrgrp> of gene annotations from the available <it>Arabidopsis</it>, <it>Carica </it>(papaya), <it>Populus</it>, <it>Medicago </it>(alfalfa), <it>Glycine</it>, <it>Cucumis </it>(cucumber), <it>Vitis</it>, <it>Mimulus</it>, <it>Oryza</it>, <it>Sorghum</it>, <it>Selaginella </it>(spike moss) and <it>Physcomitrella </it>genomes. Homologous genes sampled from exemplar asterid, ranunculid, non-grass monocot and gymnosperm species were obtained from EST assembly databases <abbrgrp>
<abbr bid="B25">25</abbr>
<abbr bid="B77">77</abbr>
<abbr bid="B78">78</abbr>
</abbrgrp> and were added to each gene family set. Sequences in each gene family set were aligned using MUSCLE <abbrgrp>
<abbr bid="B79">79</abbr>
</abbrgrp>, and RAxML <abbrgrp>
<abbr bid="B80">80</abbr>
</abbrgrp> run with the GTRGAMMA substitution model was used to obtain maximum likelihood estimates of gene trees.</p>
<p>Inspection of the resulting gene trees shows support for the inference drawn from the BAC end sequence analysis. The &#947; triplication (hexaploidy event) clearly occurred after <it>Amborella </it>diverged from other extant angiosperm lineages (Figure <figr fid="F7">7</figr>). The placement of the &#947; triplication with respect to the divergence of monocots and eudocots or core eudicots and the Ranunculales varies among the three gene trees. This incongruence among gene trees is likely due to artifacts associated with substitution rate variation and insufficient taxon sampling. Analyses of additional gene families with broader taxon sampling will be necessary to obtain better resolution for the timing of the &#947; triplication with respect to the divergence of monocot, eudicots, Ranunculales (that is, 'basal' eudicots) and core eudocots.</p>
<fig id="F7"><title><p>Figure 7</p></title><caption><p>Gene trees for auxin-independent growth promoter (<it>AXI1</it>), ceramidase and plant uncoupling mitochondrial protein 1 (<it>PUMP1</it>) gene families</p></caption><text>
   <p><b>Gene trees for auxin-independent growth promoter (<it>AXI1</it>), ceramidase and plant uncoupling mitochondrial protein 1 (<it>PUMP1</it>) gene families. (a) </b>Auxin-independent growth promoter (<it>AXI1</it>); <b>(b) </b>ceramidase; <b>(c) </b>plant uncoupling mitochondrial protein 1 [<it>PUMP1</it>] gene families. The gene trees show divergence of genes on <it>Amborella </it>contig 431 diverging from lineages leading to <it>Vitis </it>&#947; homeologs mapping to syntenic blocks on chromosomes 6, 8 and 13 (shown in red). Genes sampled from major angiosperm lineages are highlighted.</p>
</text><graphic file="gb-2011-12-5-r48-7"/></fig>
</sec>
</sec>
<sec>
<st>
<p>Conclusions</p>
</st>
<p>
<it>A. trichopoda </it>is the sister species to the large clade encompassing all other extant flowering plants. As such, comparative analyses of <it>Amborella </it>and other flowering plants offer a uniquely informative perspective on the most recent common ancestor of all extant angiosperms. The physical map and BAC end sequences described in this study provide a low-resolution view of the <it>Amborella </it>genome. Nonetheless, these data shed light on genomic features of the last common ancestor of flowering plants. Moreover, the <it>Amborella </it>genome provides a unique reference for understanding genome evolution throughout angiosperm history. When placed in the context of the physical map, BESs representing just 5.4% of the <it>Amborella </it>genome allowed reconstruction of ancestral gene blocks in regions represented by 29 BAC contigs and inference of the timing of structural mutations that disrupted these blocks (Figure <figr fid="F3">3</figr>).</p>
<p>Analyses of BESs and BAC contigs also indicate that the ancient &#947; polyploidy event inferred from the <it>Arabidopsis </it>
<abbrgrp>
<abbr bid="B58">58</abbr>
</abbrgrp>, <it>Carica </it>
<abbrgrp>
<abbr bid="B81">81</abbr>
</abbrgrp>, <it>Populus </it>
<abbrgrp>
<abbr bid="B60">60</abbr>
</abbrgrp>, and <it>Vitis </it>
<abbrgrp>
<abbr bid="B45">45</abbr>
</abbrgrp> genomes occurred after the <it>Amborella </it>lineage diverged from the rest of the angiosperms. Therefore, if the origin of angiosperms was associated with a genome duplication as has been hypothesized elsewhere <abbrgrp>
<abbr bid="B16">16</abbr>
<abbr bid="B20">20</abbr>
<abbr bid="B23">23</abbr>
</abbrgrp>, that polyploidy event predated the &#947; event.</p>
</sec>
<sec>
<st>
<p>Materials and methods</p>
</st>
<sec>
<st>
<p>BAC library construction</p>
</st>
<p>Protocols for DNA megabase preparation, library construction, picking and arraying proposed in Luo and Wing <abbrgrp>
<abbr bid="B82">82</abbr>
</abbrgrp> were followed.</p>
</sec>
<sec>
<st>
<p>Fingerprinting</p>
</st>
<p>The SNaPshot fingerprinting technique was adopted <abbrgrp>
<abbr bid="B32">32</abbr>
</abbrgrp> with the modifications described by Kim <it>et al</it>. <abbrgrp>
<abbr bid="B83">83</abbr>
</abbrgrp>. Snapshot reactions were loaded into ABI 3730xl DNA sequencers. Analysis of data for each contig was carried out using the ABI Data Collection Program.</p>
</sec>
<sec>
<st>
<p>Physical map construction</p>
</st>
<p>Fingerprints were assembled into contigs using the program FPC version 7.2 <abbrgrp>
<abbr bid="B34">34</abbr>
</abbrgrp>. The initial assembly was carried out using a Sulston score threshold of e-50 followed by three rounds of dequeuing at the same stringency and auto-merging of contigs at e-21.</p>
</sec>
<sec>
<st>
<p>BAC end extraction and sequencing</p>
</st>
<p>BAC DNA was extracted and end sequenced from 36,684 clones using the methods described by Ammiraju <it>et al</it>. <abbrgrp>
<abbr bid="B83">83</abbr>
<abbr bid="B84">84</abbr>
</abbrgrp>. Sequence quality assessment and trimming were carried out using the programs Phred <abbrgrp>
<abbr bid="B85">85</abbr>
</abbrgrp> and Lucy <abbrgrp>
<abbr bid="B86">86</abbr>
</abbrgrp>.</p>
</sec>
<sec>
<st>
<p>Random sheared library</p>
</st>
<p>A random sheared library was constructed as previously described <abbrgrp>
<abbr bid="B87">87</abbr>
</abbrgrp>.</p>
</sec>
<sec>
<st>
<p>cDNA sequencing and assembly</p>
</st>
<p>Additional Sanger ESTs were generated from available male and female flower bud cDNA libraries <abbrgrp>
<abbr bid="B10">10</abbr>
</abbrgrp> (Table <tblr tid="T4">4</tblr>). Libraries for 454 sequencing were constructed from the tissues listed in Table <tblr tid="T4">4</tblr> using the Mint cDNA synthesis kit (Evrogen, Moscow, Russia). Total RNAs for cDNA synthesis were isolated using a combination of CTAB extraction and the RNeasy Plant Mini kit (Qiagen Valencia, CA USA) as previously described for basal angiosperms <abbrgrp>
<abbr bid="B11">11</abbr>
</abbrgrp>. Two rounds of messenger RNA isolation were performed with the Poly(A)Purist&#8482; mRNA Purification Kit (Ambion Inc. Austin, TX USA) according to the manufacturer's recommendation. Contaminant DNA was removed with DNA-free&#8482; (Ambion Inc.) and mRNA quality was verified using a Bioanalyzer (Agilent Inc. Santa Clara, CA, United States). Vector and adaptor sequences were trimmed from 454 Titanium (2,943,273 reads; total read size of approximately 776 Mbp; average read length of 263.60 bp) and Sanger sequences (38,147 reads; total read size of approximately 21.3 Mbp; average read length of 559.57 bp) using seqclean <abbrgrp>
<abbr bid="B88">88</abbr>
</abbrgrp> and assembled using MIRA <abbrgrp>
<abbr bid="B89">89</abbr>
</abbrgrp>.</p>
</sec>
<sec>
<st>
<p>Similarity searches, repeat classification and contig anchoring</p>
</st>
<p>Similarity searches were carried out using the programs BLASTN and BLASTX <abbrgrp>
<abbr bid="B39">39</abbr>
</abbrgrp>. BLASTN was run under relaxed settings (-q -4 -r 5) in order to accommodate the evolutionary distance between <it>Amborella </it>and the species included in the repeat databases used; the significance threshold was set at 1e-10. In the case of BLASTX searches the threshold was set at 1e-5 or 1e-4 for the BES synteny analysis. tBLASTX was used to anchor the contigs to the reference genomes (see Results for details).</p>
</sec>
<sec>
<st>
<p>Databases</p>
</st>
<p>The databases used in similarity searches were RepBase version 15.08 <abbrgrp>
<abbr bid="B38">38</abbr>
</abbrgrp>, the GenBank non-redundant (nr) database, and the <it>Oryza</it>, <it>Arabidopsis</it>, <it>Vitis </it>and <it>Populus </it>genome sequences.</p>
</sec>
<sec>
<st>
<p>Validation of repeat searches and MITE identification</p>
</st>
<p>The program MUST <abbrgrp>
<abbr bid="B49">49</abbr>
</abbrgrp> was used for <it>de novo </it>characterization of highly repeated sequences; results were then inspected for the presence of MITE features. Inverted repeats were identified manually parsing the results of dot-plot comparisons made using the program 'Dotter' <abbrgrp>
<abbr bid="B90">90</abbr>
</abbrgrp>.</p>
</sec>
<sec>
<st>
<p>Simple sequence repeat searches</p>
</st>
<p>Microsatellites were identified using the program Sputnik <abbrgrp>
<abbr bid="B91">91</abbr>
</abbrgrp>. SSR composition, length and distribution were parsed and analyzed using the tools and the strategy used by Morgante <it>et al</it>. <abbrgrp>
<abbr bid="B92">92</abbr>
</abbrgrp>.</p>
</sec>
<sec>
<st>
<p>Fluorescence <it>in situ </it>hybridization</p>
</st>
<p>FPC contigs were validated by hybridizing BAC DNAs to <it>Amborella </it>chromosome squashes. DNA was prepared for BAC mapping to the middle and both ends of BAC contigs 431 and 1003 and used to prepare fluorescently labeled BAC-FISH probes. Chromosome squashes were prepared from root tips and labeled BAC-FISH probes were prepared as described by Xiong <it>et al</it>. <abbrgrp>
<abbr bid="B93">93</abbr>
</abbrgrp>.</p>
</sec>
<sec>
<st>
<p>Contig sequencing and annotation</p>
</st>
<p>Minimum tiling paths of seven and six BACs were identified for contigs 1003 and 431, respectively, by the visual inspection of the FPC assemblies. Adjacent clones were chosen based on their reciprocal position and probability value associated to their overlapping fingerprinted bands as shown by FPC. Sequencing of selected minimum tiling path BACs was done to phase II quality as previously described <abbrgrp>
<abbr bid="B73">73</abbr>
</abbrgrp>. Phase II BAC sequences were then assembled into 1003 and 431 contig sequences based on dot plot comparisons and overlap similarity between adjacent clones.</p>
<p>Perl scripts available from the DAWGPAWS package <abbrgrp>
<abbr bid="B61">61</abbr>
<abbr bid="B62">62</abbr>
</abbrgrp> were used to convert computational annotation results from multiple sources into a single GFF3 file for combined evidence annotation in Apollo <abbrgrp>
<abbr bid="B94">94</abbr>
</abbrgrp> and publication in Gbrowse <abbrgrp>
<abbr bid="B95">95</abbr>
</abbrgrp>. <it>Ab initio </it>gene annotation programs used in this process included FGENESH <abbrgrp>
<abbr bid="B63">63</abbr>
</abbrgrp> AUGUSTUS <abbrgrp>
<abbr bid="B64">64</abbr>
</abbrgrp>, SNAP <abbrgrp>
<abbr bid="B65">65</abbr>
</abbrgrp>, GeneID <abbrgrp>
<abbr bid="B66">66</abbr>
</abbrgrp> and GenScan <abbrgrp>
<abbr bid="B67">67</abbr>
</abbrgrp>. Because <it>Amborella</it>-specific gene model parameterizations were not available for these programs, multiple plant models were used for each <it>ab initio </it>program. The sequence of the entire contig was BLASTx (e &lt; 1 &#215; 10<sup>-5</sup>) searched against gene annotations from <it>Arabidopsis </it>
<abbrgrp>
<abbr bid="B70">70</abbr>
</abbrgrp>, <it>Vitis </it>
<abbrgrp>
<abbr bid="B45">45</abbr>
</abbrgrp>, <it>Z. mays </it>
<abbrgrp>
<abbr bid="B56">56</abbr>
</abbrgrp>, <it>Medicago </it>
<abbrgrp>
<abbr bid="B71">71</abbr>
</abbrgrp>, <it>Oryza </it>
<abbrgrp>
<abbr bid="B72">72</abbr>
</abbrgrp>, and <it>Sorghum </it>
<abbrgrp>
<abbr bid="B55">55</abbr>
</abbrgrp> as well as tBLASTx (e &lt; 1 &#215; 10<sup>-5</sup>) searched against a database of comprehensive <it>Amborella </it>transcript assemblies <abbrgrp>
<abbr bid="B25">25</abbr>
</abbrgrp>. In addition, <it>Amborella </it>EST sequences (reads and assemblies; Table <tblr tid="T4">4</tblr>) were splice-aligned to the contigs using GMAP (Genomic Mapping and Alignment Program) <abbrgrp>
<abbr bid="B68">68</abbr>
</abbrgrp> with the PASA (Program to Assemble Spliced Alignments) genome annotation tool <abbrgrp>
<abbr bid="B69">69</abbr>
</abbrgrp>. The gene models and BLAST search results were manually combined into gene models using the Apollo genome annotation curation tool <abbrgrp>
<abbr bid="B94">94</abbr>
</abbrgrp>.</p>
</sec>
<sec>
<st>
<p>Synteny analysis of sequenced BAC contigs with <it>Vitis </it>and <it>Oryza </it>genomes</p>
</st>
<p>Sequenced <it>Amborella </it>BAC contigs 431 (487,318 bp) and 1003 (629,678 bp) were compared to the International Rice Genome Sequencing Project (IRGSP) rice genome assembly (version 5) and the Genoscope 12 &#215; <it>Vitis </it>genome assembly using LASTZ and default parameters. Prior to LASTZ comparisons, all genomic sequences were masked using NCBI's WindowMasker to remove simple repeats. Significant matches after repeat masking were visualized as dot plots. Gene annotations for the rice and <it>Vitis </it>genomes were obtained from the Rice Annotation Project <abbrgrp>
<abbr bid="B96">96</abbr>
</abbrgrp> and Genoscope <abbrgrp>
<abbr bid="B97">97</abbr>
</abbrgrp>, respectively, and plotted on the vertical axes of the dot plots (Figures <figr fid="F5">5</figr> and <figr fid="F6">6</figr>). FGENESH <abbrgrp>
<abbr bid="B63">63</abbr>
</abbrgrp> annotations for the <it>Amborella </it>contigs were included on the horizontal axes of the dot plots. LASTZ scores were summed for all aligned <it>Amborella</it>-rice or <it>Amborella-Vitis </it>blocks within 100 kb of each other in sequenced genomes. All regions with summed scores &gt;100,000 were considered as syntenic and included in Figures <figr fid="F5">5</figr> and <figr fid="F6">6</figr>.</p>
</sec>
<sec>
<st>
<p>Phylogenetic analysis</p>
</st>
<p>All alignments were carried out using the program 'MUSCLE' <abbrgrp>
<abbr bid="B79">79</abbr>
</abbrgrp> run under default settings. Maximum likelihood analyses were run on aligned DNA and amino acid sequences using RAxML <abbrgrp>
<abbr bid="B80">80</abbr>
</abbrgrp> and the GTRGAMMA nucleotide substitution model.</p>
</sec>
<sec>
<st>
<p>Submission of data to GenBank databases</p>
</st>
<p>BESs (<ext-link ext-link-id="HR616970" ext-link-type="gen">HR616970</ext-link> to <ext-link ext-link-id="HR686434" ext-link-type="gen">HR686434</ext-link>), full-length BAC sequences (<ext-link ext-link-id="AC243594" ext-link-type="gen">AC243594.1</ext-link> to <ext-link ext-link-id="AC243606.1" ext-link-type="gen">AC243606.1</ext-link>), Sanger shotgun sequences (<ext-link ext-link-id="HR614237" ext-link-type="gen">HR614237</ext-link> to <ext-link ext-link-id="HR616931" ext-link-type="gen">HR616931</ext-link>), 454 shotgun sequences (<ext-link ext-link-id="SRP006044" ext-link-type="gen">SRP006044</ext-link>), Sanger ESTs (<ext-link ext-link-id="FD425831.1" ext-link-type="gen">FD425831.1</ext-link> to <ext-link ext-link-id="FD443502.1" ext-link-type="gen">FD443502.1</ext-link>) and 454 cDNA sequences (<ext-link ext-link-id="SRX018174" ext-link-type="gen">SRX018174</ext-link>, <ext-link ext-link-id="SRX018165" ext-link-type="gen">SRX018165</ext-link>, <ext-link ext-link-id="SRX018164" ext-link-type="gen">SRX018164</ext-link>, <ext-link ext-link-id="SRX018163" ext-link-type="gen">SRX018163</ext-link>, <ext-link ext-link-id="SRX018157" ext-link-type="gen">SRX018157</ext-link>, <ext-link ext-link-id="SRX018156" ext-link-type="gen">SRX018156</ext-link>) have been deposited in the appropriate NCBI GenBank sequence databases. All sequences are also available at the Ancestral Angiosperm Genome Project website <abbrgrp>
<abbr bid="B25">25</abbr>
</abbrgrp>.</p>
</sec>
</sec>
<sec>
<st>
<p>Abbreviations</p>
</st>
<p>bp: base pair; BAC: bacterial artificial chromosome; BES: BAC end sequence; EST: expressed sequence tag; FISH: fluorescence <it>in situ </it>hybridization; HICF: high information content fingerprinting; LINE: long interspersed element; LTR: long terminal repeat; MITE: miniature inverted repeat transposable element; SSR: simple sequence repeat; TE: transposable element.</p>
</sec>
<sec>
<st>
<p>Authors' contributions</p>
</st>
<p>JLM, AZ, RAW and CWD designed and coordinated the study. The <it>Amborella </it>BAC library was constructed and characterized in the Arizona Genomics Institute (AGI) by DK, YY, KC, JLG, AS and ML. cDNA library production and sequencing was performed by AC at the University of Florida and assemblies were performed by SA. Funding for BAC library construction was obtained by DM, JB, JEC, JT, CWD and RAW. Comparative analyses were performed by AZ, AS, JEB, JCE, JD, HT, SR, AHP, DES, PSS, VAA, HM, CWD and JL-M. Florescence <it>in situ </it>hybridizations were performed by ZX and JCP. BAC contig annotations were performed by JEB, JCE, SC, BB and JLM. AZ and JLM wrote the first draft of the manuscript and all authors contributed to refinement.</p>
</sec>
</bdy><bm>
<ack>
<sec>
<st>
<p>Acknowledgements</p>
</st>
<p>This work was supported with funding from National Science Foundation grants 0208502, 0638595 and 0922742. We also acknowledge helpful comments and suggestions provided by anonymous reviewers.</p>
</sec>
</ack>
<refgrp><bibl id="B1"><title><p>Towards a phylogenetic nomenclature of Tracheophyta.</p></title><aug><au><snm>Cantino</snm><fnm>P</fnm></au><au><snm>Doyle</snm><fnm>JJ</fnm></au><au><snm>Graham</snm><fnm>S</fnm></au><au><snm>Judd</snm><fnm>W</fnm></au><au><snm>Olmstead</snm><fnm>R</fnm></au><au><snm>Soltis</snm><fnm>D</fnm></au><au><snm>Soltis</snm><fnm>P</fnm></au><au><snm>Donoghue</snm><fnm>MJ</fnm></au></aug><source>Taxon</source><pubdate>2007</pubdate><volume>56</volume><fpage>822</fpage><lpage>846</lpage><xrefbib><pubid idtype="doi">10.2307/25065865</pubid></xrefbib></bibl><bibl id="B2"><title><p>A genomics approach to the study of floral developmental genetics: strengths and limitations.</p></title><aug><au><snm>Leebens-Mack</snm><fnm>JH</fnm></au><au><snm>Wall</snm><fnm>PK</fnm></au><au><snm>Duarte</snm><fnm>J</fnm></au><au><snm>Zheng</snm><fnm>Z</fnm></au><au><snm>Oppenheimer</snm><fnm>D</fnm></au><au><snm>dePamphilis</snm><fnm>CW</fnm></au></aug><source>Adv Bot Res</source><pubdate>2006</pubdate><volume>44</volume><fpage>527</fpage><lpage>549</lpage></bibl><bibl id="B3"><title><p>The <it>Amborella </it>genome: an evolutionary reference for plant biology.</p></title><aug><au><snm>Soltis</snm><fnm>DE</fnm></au><au><snm>Albert</snm><fnm>VA</fnm></au><au><snm>Leebens-Mack</snm><fnm>J</fnm></au><au><snm>Palmer</snm><fnm>JD</fnm></au><au><snm>Wing</snm><fnm>RA</fnm></au><au><snm>dePamphilis</snm><fnm>CW</fnm></au><au><snm>Ma</snm><fnm>H</fnm></au><au><snm>Carlson</snm><fnm>JE</fnm></au><au><snm>Altman</snm><fnm>N</fnm></au><au><snm>Kim</snm><fnm>S</fnm></au><au><snm>Wall</snm><fnm>PK</fnm></au><au><snm>Zuccolo</snm><fnm>A</fnm></au><au><snm>Soltis</snm><fnm>PS</fnm></au></aug><source>Genome Biol</source><pubdate>2008</pubdate><volume>9</volume><fpage>402</fpage><xrefbib><pubidlist><pubid idtype="doi">10.1186/gb-2008-9-3-402</pubid><pubid idtype="pmcid">2397498</pubid><pubid idtype="pmpid" link="fulltext">18341710</pubid></pubidlist></xrefbib></bibl><bibl id="B4"><title><p>The root of angiosperm phylogeny inferred from duplicate phytochrome genes.</p></title><aug><au><snm>Mathews</snm><fnm>S</fnm></au><au><snm>Donoghue</snm><fnm>MJ</fnm></au></aug><source>Science</source><pubdate>1999</pubdate><volume>286</volume><fpage>947</fpage><lpage>950</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1126/science.286.5441.947</pubid><pubid idtype="pmpid" link="fulltext">10542147</pubid></pubidlist></xrefbib></bibl><bibl id="B5"><title><p>The earliest angiosperms: evidence from mitochondrial, plastid and nuclear genomes.</p></title><aug><au><snm>Qiu</snm><fnm>YL</fnm></au><au><snm>Lee</snm><fnm>J</fnm></au><au><snm>Bernasconi-Quadroni</snm><fnm>F</fnm></au><au><snm>Soltis</snm><fnm>DE</fnm></au><au><snm>Soltis</snm><fnm>PS</fnm></au><au><snm>Zanis</snm><fnm>M</fnm></au><au><snm>Zimmer</snm><fnm>EA</fnm></au><au><snm>Chen</snm><fnm>Z</fnm></au><au><snm>Savolainen</snm><fnm>V</fnm></au><au><snm>Chase</snm><fnm>MW</fnm></au></aug><source>Nature</source><pubdate>1999</pubdate><volume>402</volume><fpage>404</fpage><lpage>407</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/46536</pubid><pubid idtype="pmpid" link="fulltext">10586879</pubid></pubidlist></xrefbib></bibl><bibl id="B6"><title><p>Angiosperm phylogeny inferred from multiple genes as a tool for comparative biology.</p></title><aug><au><snm>Soltis</snm><fnm>PS</fnm></au><au><snm>Soltis</snm><fnm>DE</fnm></au><au><snm>Chase</snm><fnm>MW</fnm></au></aug><source>Nature</source><pubdate>1999</pubdate><volume>402</volume><fpage>402</fpage><lpage>404</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/46528</pubid><pubid idtype="pmpid" link="fulltext">10586878</pubid></pubidlist></xrefbib></bibl><bibl id="B7"><title><p>Analysis of 81 genes from 64 plastid genomes resolves relationships in angiosperms and identifies genome-scale evolutionary patterns.</p></title><aug><au><snm>Jansen</snm><fnm>RK</fnm></au><au><snm>Cai</snm><fnm>Z</fnm></au><au><snm>Raubeson</snm><fnm>LA</fnm></au><au><snm>Daniell</snm><fnm>H</fnm></au><au><snm>dePamphilis</snm><fnm>CW</fnm></au><au><snm>Leebens-Mack</snm><fnm>J</fnm></au><au><snm>Muller</snm><fnm>KF</fnm></au><au><snm>Guisinger-Bellian</snm><fnm>M</fnm></au><au><snm>Haberle</snm><fnm>RC</fnm></au><au><snm>Hansen</snm><fnm>AK</fnm></au><au><snm>Chumley</snm><fnm>TW</fnm></au><au><snm>Lee</snm><fnm>SB</fnm></au><au><snm>Peery</snm><fnm>R</fnm></au><au><snm>McNeal</snm><fnm>JR</fnm></au><au><snm>Kuehl</snm><fnm>JV</fnm></au><au><snm>Boore</snm><fnm>JL</fnm></au></aug><source>Proc Natl Acad Sci USA</source><pubdate>2007</pubdate><volume>104</volume><fpage>19369</fpage><lpage>19374</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1073/pnas.0709121104</pubid><pubid idtype="pmcid">2148296</pubid><pubid idtype="pmpid" link="fulltext">18048330</pubid></pubidlist></xrefbib></bibl><bibl id="B8"><title><p>Using plastid genome-scale data to resolve enigmatic relationships among basal angiosperms.</p></title><aug><au><snm>Moore</snm><fnm>MJ</fnm></au><au><snm>Bell</snm><fnm>CD</fnm></au><au><snm>Soltis</snm><fnm>PS</fnm></au><au><snm>Soltis</snm><fnm>DE</fnm></au></aug><source>Proc Natl Acad Sci USA</source><pubdate>2007</pubdate><volume>104</volume><fpage>19363</fpage><lpage>19368</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1073/pnas.0708072104</pubid><pubid idtype="pmcid">2148295</pubid><pubid idtype="pmpid" link="fulltext">18048334</pubid></pubidlist></xrefbib></bibl><bibl id="B9"><title><p>Genome analysis of the platypus reveals unique signatures of evolution.</p></title><aug><au><snm>Warren</snm><fnm>WC</fnm></au><au><snm>Hillier</snm><fnm>LW</fnm></au><au><snm>Marshall Graves</snm><fnm>JA</fnm></au><au><snm>Birney</snm><fnm>E</fnm></au><au><snm>Ponting</snm><fnm>CP</fnm></au><au><snm>Grutzner</snm><fnm>F</fnm></au><au><snm>Belov</snm><fnm>K</fnm></au><au><snm>Miller</snm><fnm>W</fnm></au><au><snm>Clarke</snm><fnm>L</fnm></au><au><snm>Chinwalla</snm><fnm>AT</fnm></au><au><snm>Yang</snm><fnm>SP</fnm></au><au><snm>Heger</snm><fnm>A</fnm></au><au><snm>Locke</snm><fnm>DP</fnm></au><au><snm>Miethke</snm><fnm>P</fnm></au><au><snm>Waters</snm><fnm>PD</fnm></au><au><snm>Veyrunes</snm><fnm>F</fnm></au><au><snm>Fulton</snm><fnm>L</fnm></au><au><snm>Fulton</snm><fnm>B</fnm></au><au><snm>Graves</snm><fnm>T</fnm></au><au><snm>Wallis</snm><fnm>J</fnm></au><au><snm>Puente</snm><fnm>XS</fnm></au><au><snm>Lopez-Otin</snm><fnm>C</fnm></au><au><snm>Ordonez</snm><fnm>GR</fnm></au><au><snm>Eichler</snm><fnm>EE</fnm></au><au><snm>Chen</snm><fnm>L</fnm></au><au><snm>Cheng</snm><fnm>Z</fnm></au><au><snm>Deakin</snm><fnm>JE</fnm></au><au><snm>Alsop</snm><fnm>A</fnm></au><au><snm>Thompson</snm><fnm>K</fnm></au><au><snm>Kirby</snm><fnm>P</fnm></au><etal/></aug><source>Nature</source><pubdate>2008</pubdate><volume>453</volume><fpage>175</fpage><lpage>183</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/nature06936</pubid><pubid idtype="pmcid">2803040</pubid><pubid idtype="pmpid" link="fulltext">18464734</pubid></pubidlist></xrefbib></bibl><bibl id="B10"><title><p>Floral gene resources from basal angiosperms for comparative genomics research.</p></title><aug><au><snm>Albert</snm><fnm>VA</fnm></au><au><snm>Soltis</snm><fnm>DE</fnm></au><au><snm>Carlson</snm><fnm>JE</fnm></au><au><snm>Farmerie</snm><fnm>WG</fnm></au><au><snm>Wall</snm><fnm>PK</fnm></au><au><snm>Ilut</snm><fnm>DC</fnm></au><au><snm>Solow</snm><fnm>TM</fnm></au><au><snm>Mueller</snm><fnm>LA</fnm></au><au><snm>Landherr</snm><fnm>LL</fnm></au><au><snm>Hu</snm><fnm>Y</fnm></au><au><snm>Buzgo</snm><fnm>M</fnm></au><au><snm>Kim</snm><fnm>S</fnm></au><au><snm>Yoo</snm><fnm>MJ</fnm></au><au><snm>Frohlich</snm><fnm>MW</fnm></au><au><snm>Perl-Treves</snm><fnm>R</fnm></au><au><snm>Schlarbaum</snm><fnm>SE</fnm></au><au><snm>Bliss</snm><fnm>BJ</fnm></au><au><snm>Zhang</snm><fnm>X</fnm></au><au><snm>Tanksley</snm><fnm>SD</fnm></au><au><snm>Oppenheimer</snm><fnm>DG</fnm></au><au><snm>Soltis</snm><fnm>PS</fnm></au><au><snm>Ma</snm><fnm>H</fnm></au><au><snm>dePamphilis</snm><fnm>CW</fnm></au><au><snm>Leebens-Mack</snm><fnm>JH</fnm></au></aug><source>BMC Plant Biol</source><pubdate>2005</pubdate><volume>5</volume><fpage>5</fpage><xrefbib><pubidlist><pubid idtype="doi">10.1186/1471-2229-5-5</pubid><pubid idtype="pmcid">1083416</pubid><pubid idtype="pmpid" link="fulltext">15799777</pubid></pubidlist></xrefbib></bibl><bibl id="B11"><title><p>Expression of floral MADS-box genes in basal angiosperms: implications for the evolution of floral regulators.</p></title><aug><au><snm>Kim</snm><fnm>S</fnm></au><au><snm>Koh</snm><fnm>J</fnm></au><au><snm>Yoo</snm><fnm>MJ</fnm></au><au><snm>Kong</snm><fnm>H</fnm></au><au><snm>Hu</snm><fnm>Y</fnm></au><au><snm>Ma</snm><fnm>H</fnm></au><au><snm>Soltis</snm><fnm>PS</fnm></au><au><snm>Soltis</snm><fnm>DE</fnm></au></aug><source>Plant J</source><pubdate>2005</pubdate><volume>43</volume><fpage>724</fpage><lpage>744</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1111/j.1365-313X.2005.02487.x</pubid><pubid idtype="pmpid" link="fulltext">16115069</pubid></pubidlist></xrefbib></bibl><bibl id="B12"><title><p>The ABC model and its applicability to basal angiosperms.</p></title><aug><au><snm>Soltis</snm><fnm>DE</fnm></au><au><snm>Chanderbali</snm><fnm>AS</fnm></au><au><snm>Kim</snm><fnm>S</fnm></au><au><snm>Buzgo</snm><fnm>M</fnm></au><au><snm>Soltis</snm><fnm>PS</fnm></au></aug><source>Ann Bot</source><pubdate>2007</pubdate><volume>100</volume><fpage>155</fpage><lpage>163</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/aob/mcm117</pubid><pubid idtype="pmcid">2735328</pubid><pubid idtype="pmpid" link="fulltext">17616563</pubid></pubidlist></xrefbib></bibl><bibl id="B13"><title><p>Insights from ANA-grade angiosperms into the early evolution of CUP-SHAPED COTYLEDON genes.</p></title><aug><au><snm>Vialette-Guiraud</snm><fnm>AC</fnm></au><au><snm>Adam</snm><fnm>H</fnm></au><au><snm>Finet</snm><fnm>C</fnm></au><au><snm>Jasinski</snm><fnm>S</fnm></au><au><snm>Jouannic</snm><fnm>S</fnm></au><au><snm>Scutt</snm><fnm>CP</fnm></au></aug><source>Ann Bot</source><pubdate>2011</pubdate><volume>107</volume><fpage>1511</fpage><lpage>1519</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/aob/mcr024</pubid><pubid idtype="pmpid" link="fulltext">21320879</pubid></pubidlist></xrefbib></bibl><bibl id="B14"><title><p>Functional conservation between CRABS CLAW orthologues from widely diverged angiosperms.</p></title><aug><au><snm>Fourquin</snm><fnm>C</fnm></au><au><snm>Vinauger-Douard</snm><fnm>M</fnm></au><au><snm>Chambrier</snm><fnm>P</fnm></au><au><snm>Berne-Dedieu</snm><fnm>A</fnm></au><au><snm>Scutt</snm><fnm>CP</fnm></au></aug><source>Ann Bot</source><pubdate>2007</pubdate><volume>100</volume><fpage>651</fpage><lpage>657</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/aob/mcm136</pubid><pubid idtype="pmcid">2533609</pubid><pubid idtype="pmpid" link="fulltext">17650514</pubid></pubidlist></xrefbib></bibl><bibl id="B15"><title><p>Evidence that CRABS CLAW and TOUSLED have conserved their roles in carpel development since the ancestor of the extant angiosperms.</p></title><aug><au><snm>Fourquin</snm><fnm>C</fnm></au><au><snm>Vinauger-Douard</snm><fnm>M</fnm></au><au><snm>Fogliani</snm><fnm>B</fnm></au><au><snm>Dumas</snm><fnm>C</fnm></au><au><snm>Scutt</snm><fnm>CP</fnm></au></aug><source>Proc Natl Acad Sci USA</source><pubdate>2005</pubdate><volume>102</volume><fpage>4649</fpage><lpage>4654</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1073/pnas.0409577102</pubid><pubid idtype="pmcid">555504</pubid><pubid idtype="pmpid" link="fulltext">15767586</pubid></pubidlist></xrefbib></bibl><bibl id="B16"><title><p>The evolution of the SEPALLATA subfamily of MADS-box genes: a preangiosperm origin with multiple duplications throughout angiosperm history.</p></title><aug><au><snm>Zahn</snm><fnm>LM</fnm></au><au><snm>Kong</snm><fnm>H</fnm></au><au><snm>Leebens-Mack</snm><fnm>JH</fnm></au><au><snm>Kim</snm><fnm>S</fnm></au><au><snm>Soltis</snm><fnm>PS</fnm></au><au><snm>Landherr</snm><fnm>LL</fnm></au><au><snm>Soltis</snm><fnm>DE</fnm></au><au><snm>dePamphilis</snm><fnm>CW</fnm></au><au><snm>Ma</snm><fnm>H</fnm></au></aug><source>Genetics</source><pubdate>2005</pubdate><volume>169</volume><fpage>2209</fpage><lpage>2223</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1534/genetics.104.037770</pubid><pubid idtype="pmcid">1449606</pubid><pubid idtype="pmpid" link="fulltext">15687268</pubid></pubidlist></xrefbib></bibl><bibl id="B17"><title><p>To B or Not to B a flower: the role of DEFICIENS and GLOBOSA orthologs in the evolution of the angiosperms.</p></title><aug><au><snm>Zahn</snm><fnm>LM</fnm></au><au><snm>Leebens-Mack</snm><fnm>J</fnm></au><au><snm>dePamphilis</snm><fnm>CW</fnm></au><au><snm>Ma</snm><fnm>H</fnm></au><au><snm>Theissen</snm><fnm>G</fnm></au></aug><source>J Hered</source><pubdate>2005</pubdate><volume>96</volume><fpage>225</fpage><lpage>240</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/jhered/esi033</pubid><pubid idtype="pmpid" link="fulltext">15695551</pubid></pubidlist></xrefbib></bibl><bibl id="B18"><title><p>Conservation and divergence in the AGAMOUS subfamily of MADS-box genes: evidence of independent sub- and neofunctionalization events.</p></title><aug><au><snm>Zahn</snm><fnm>LM</fnm></au><au><snm>Leebens-Mack</snm><fnm>JH</fnm></au><au><snm>Arrington</snm><fnm>JM</fnm></au><au><snm>Hu</snm><fnm>Y</fnm></au><au><snm>Landherr</snm><fnm>LL</fnm></au><au><snm>dePamphilis</snm><fnm>CW</fnm></au><au><snm>Becker</snm><fnm>A</fnm></au><au><snm>Theissen</snm><fnm>G</fnm></au><au><snm>Ma</snm><fnm>H</fnm></au></aug><source>Evol Dev</source><pubdate>2006</pubdate><volume>8</volume><fpage>30</fpage><lpage>45</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1111/j.1525-142X.2006.05073.x</pubid><pubid idtype="pmpid" link="fulltext">16409381</pubid></pubidlist></xrefbib></bibl><bibl id="B19"><title><p>Evolution of plant MADS box transcription factors: evidence for shifts in selection associated with early angiosperm diversification and concerted gene duplications.</p></title><aug><au><snm>Shan</snm><fnm>H</fnm></au><au><snm>Zahn</snm><fnm>L</fnm></au><au><snm>Guindon</snm><fnm>S</fnm></au><au><snm>Wall</snm><fnm>PK</fnm></au><au><snm>Kong</snm><fnm>H</fnm></au><au><snm>Ma</snm><fnm>H</fnm></au><au><snm>dePamphilis</snm><fnm>CW</fnm></au><au><snm>Leebens-Mack</snm><fnm>J</fnm></au></aug><source>Mol Biol Evol</source><pubdate>2009</pubdate><volume>26</volume><fpage>2229</fpage><lpage>2244</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/molbev/msp129</pubid><pubid idtype="pmpid" link="fulltext">19578156</pubid></pubidlist></xrefbib></bibl><bibl id="B20"><title><p>Widespread genome duplications throughout the history of flowering plants.</p></title><aug><au><snm>Cui</snm><fnm>L</fnm></au><au><snm>Wall</snm><fnm>PK</fnm></au><au><snm>Leebens-Mack</snm><fnm>JH</fnm></au><au><snm>Lindsay</snm><fnm>BG</fnm></au><au><snm>Soltis</snm><fnm>DE</fnm></au><au><snm>Doyle</snm><fnm>JJ</fnm></au><au><snm>Soltis</snm><fnm>PS</fnm></au><au><snm>Carlson</snm><fnm>JE</fnm></au><au><snm>Arumuganathan</snm><fnm>K</fnm></au><au><snm>Barakat</snm><fnm>A</fnm></au><au><snm>Albert</snm><fnm>VA</fnm></au><au><snm>Ma</snm><fnm>H</fnm></au><au><snm>dePamphilis</snm><fnm>CW</fnm></au></aug><source>Genome Res</source><pubdate>2006</pubdate><volume>16</volume><fpage>738</fpage><lpage>749</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1101/gr.4825606</pubid><pubid idtype="pmcid">1479859</pubid><pubid idtype="pmpid" link="fulltext">16702410</pubid></pubidlist></xrefbib></bibl><bibl id="B21"><title><p>The flowering world: a tale of duplications.</p></title><aug><au><snm>Van de Peer</snm><fnm>Y</fnm></au><au><snm>Fawcett</snm><fnm>JA</fnm></au><au><snm>Proost</snm><fnm>S</fnm></au><au><snm>Sterck</snm><fnm>L</fnm></au><au><snm>Vandepoele</snm><fnm>K</fnm></au></aug><source>Trends Plant Sci</source><pubdate>2009</pubdate><volume>14</volume><fpage>680</fpage><lpage>688</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1016/j.tplants.2009.09.001</pubid><pubid idtype="pmpid" link="fulltext">19818673</pubid></pubidlist></xrefbib></bibl><bibl id="B22"><title><p>The frequency of polyploid speciation in vascular plants.</p></title><aug><au><snm>Wood</snm><fnm>TE</fnm></au><au><snm>Takebayashi</snm><fnm>N</fnm></au><au><snm>Barker</snm><fnm>MS</fnm></au><au><snm>Mayrose</snm><fnm>I</fnm></au><au><snm>Greenspoon</snm><fnm>PB</fnm></au><au><snm>Rieseberg</snm><fnm>LH</fnm></au></aug><source>Proc Natl Acad Sci USA</source><pubdate>2009</pubdate><volume>106</volume><fpage>13875</fpage><lpage>13879</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1073/pnas.0811575106</pubid><pubid idtype="pmcid">2728988</pubid><pubid idtype="pmpid" link="fulltext">19667210</pubid></pubidlist></xrefbib></bibl><bibl id="B23"><title><p>Genome duplication and the origin of angiosperms.</p></title><aug><au><snm>De Bodt</snm><fnm>S</fnm></au><au><snm>Maere</snm><fnm>S</fnm></au><au><snm>Van de Peer</snm><fnm>Y</fnm></au></aug><source>Trends Ecol Evol</source><pubdate>2005</pubdate><volume>20</volume><fpage>591</fpage><lpage>597</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1016/j.tree.2005.07.008</pubid><pubid idtype="pmpid" link="fulltext">16701441</pubid></pubidlist></xrefbib></bibl><bibl id="B24"><title><p>Polyploidy and angiosperm diversification.</p></title><aug><au><snm>Soltis</snm><fnm>DE</fnm></au><au><snm>Albert</snm><fnm>VA</fnm></au><au><snm>Leebens-Mack</snm><fnm>J</fnm></au><au><snm>Bell</snm><fnm>CD</fnm></au><au><snm>Paterson</snm><fnm>AH</fnm></au><au><snm>Zheng</snm><fnm>C</fnm></au><au><snm>Sankoff</snm><fnm>D</fnm></au><au><snm>dePamphilis</snm><fnm>CW</fnm></au><au><snm>Wall</snm><fnm>PK</fnm></au><au><snm>Soltis</snm><fnm>PS</fnm></au></aug><source>Am J Bot</source><pubdate>2009</pubdate><volume>96</volume><fpage>336</fpage><lpage>348</lpage><xrefbib><pubidlist><pubid idtype="doi">10.3732/ajb.0800079</pubid><pubid idtype="pmpid">21628192</pubid></pubidlist></xrefbib></bibl><bibl id="B25"><title><p>Ancestral Angiosperm Genome Project.</p></title><url>http://ancangio.uga.edu/</url></bibl><bibl id="B26"><title><p>Finding and comparing syntenic regions among <it>Arabidopsis </it>and the outgroups papaya, poplar, and grape: CoGe with rosids.</p></title><aug><au><snm>Lyons</snm><fnm>E</fnm></au><au><snm>Pedersen</snm><fnm>B</fnm></au><au><snm>Kane</snm><fnm>J</fnm></au><au><snm>Alam</snm><fnm>M</fnm></au><au><snm>Ming</snm><fnm>R</fnm></au><au><snm>Tang</snm><fnm>H</fnm></au><au><snm>Wang</snm><fnm>X</fnm></au><au><snm>Bowers</snm><fnm>J</fnm></au><au><snm>Paterson</snm><fnm>A</fnm></au><au><snm>Lisch</snm><fnm>D</fnm></au><au><snm>Freeling</snm><fnm>M</fnm></au></aug><source>Plant Physiol</source><pubdate>2008</pubdate><volume>148</volume><fpage>1772</fpage><lpage>1781</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1104/pp.108.124867</pubid><pubid idtype="pmcid">2593677</pubid><pubid idtype="pmpid" link="fulltext">18952863</pubid></pubidlist></xrefbib></bibl><bibl id="B27"><title><p>Synteny and collinearity in plant genomes.</p></title><aug><au><snm>Tang</snm><fnm>H</fnm></au><au><snm>Bowers</snm><fnm>JE</fnm></au><au><snm>Wang</snm><fnm>X</fnm></au><au><snm>Ming</snm><fnm>R</fnm></au><au><snm>Alam</snm><fnm>M</fnm></au><au><snm>Paterson</snm><fnm>AH</fnm></au></aug><source>Science</source><pubdate>2008</pubdate><volume>320</volume><fpage>486</fpage><lpage>488</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1126/science.1153917</pubid><pubid idtype="pmpid" link="fulltext">18436778</pubid></pubidlist></xrefbib></bibl><bibl id="B28"><title><p>Angiosperm genome comparisons reveal early polyploidy in the monocot lineage.</p></title><aug><au><snm>Tang</snm><fnm>H</fnm></au><au><snm>Bowers</snm><fnm>JE</fnm></au><au><snm>Wang</snm><fnm>X</fnm></au><au><snm>Paterson</snm><fnm>AH</fnm></au></aug><source>Proc Natl Acad Sci USA</source><pubdate>2010</pubdate><volume>107</volume><fpage>472</fpage><lpage>477</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1073/pnas.0908007107</pubid><pubid idtype="pmcid">2806719</pubid><pubid idtype="pmpid" link="fulltext">19966307</pubid></pubidlist></xrefbib></bibl><bibl id="B29"><title><p>Unraveling ancient hexaploidy through multiply-aligned angiosperm gene maps.</p></title><aug><au><snm>Tang</snm><fnm>H</fnm></au><au><snm>Wang</snm><fnm>X</fnm></au><au><snm>Bowers</snm><fnm>JE</fnm></au><au><snm>Ming</snm><fnm>R</fnm></au><au><snm>Alam</snm><fnm>M</fnm></au><au><snm>Paterson</snm><fnm>AH</fnm></au></aug><source>Genome Res</source><pubdate>2008</pubdate><volume>18</volume><fpage>1944</fpage><lpage>1954</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1101/gr.080978.108</pubid><pubid idtype="pmcid">2593578</pubid><pubid idtype="pmpid" link="fulltext">18832442</pubid></pubidlist></xrefbib></bibl><bibl id="B30"><title><p>DNA C-values in seven families fill phylogenetic gapsin the basal angiosperms.</p></title><aug><au><snm>Leitch</snm><fnm>I</fnm></au><au><snm>Hanson</snm><fnm>L</fnm></au></aug><source>Bot J Linn Soc</source><pubdate>2002</pubdate><volume>140</volume><fpage>175</fpage><lpage>179</lpage><xrefbib><pubid idtype="doi">10.1046/j.1095-8339.2002.00096.x</pubid></xrefbib></bibl><bibl id="B31"><title><p>Arizona Genome Institute.</p></title><url>http://www.genome.arizona.edu/orders/direct.html?library=AT_SBa</url></bibl><bibl id="B32"><title><p>High-throughput fingerprinting of bacterial artificial chromosomes using the snapshot labeling kit and sizing of restriction fragments by capillary electrophoresis.</p></title><aug><au><snm>Luo</snm><fnm>MC</fnm></au><au><snm>Thomas</snm><fnm>C</fnm></au><au><snm>You</snm><fnm>FM</fnm></au><au><snm>Hsiao</snm><fnm>J</fnm></au><au><snm>Ouyang</snm><fnm>S</fnm></au><au><snm>Buell</snm><fnm>CR</fnm></au><au><snm>Malandro</snm><fnm>M</fnm></au><au><snm>McGuire</snm><fnm>PE</fnm></au><au><snm>Anderson</snm><fnm>OD</fnm></au><au><snm>Dvorak</snm><fnm>J</fnm></au></aug><source>Genomics</source><pubdate>2003</pubdate><volume>82</volume><fpage>378</fpage><lpage>389</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1016/S0888-7543(03)00128-9</pubid><pubid idtype="pmpid" link="fulltext">12906862</pubid></pubidlist></xrefbib></bibl><bibl id="B33"><title><p>Whole-genome validation of high-information-content fingerprinting.</p></title><aug><au><snm>Nelson</snm><fnm>WM</fnm></au><au><snm>Bharti</snm><fnm>AK</fnm></au><au><snm>Butler</snm><fnm>E</fnm></au><au><snm>Wei</snm><fnm>F</fnm></au><au><snm>Fuks</snm><fnm>G</fnm></au><au><snm>Kim</snm><fnm>H</fnm></au><au><snm>Wing</snm><fnm>RA</fnm></au><au><snm>Messing</snm><fnm>J</fnm></au><au><snm>Soderlund</snm><fnm>C</fnm></au></aug><source>Plant Physiol</source><pubdate>2005</pubdate><volume>139</volume><fpage>27</fpage><lpage>38</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1104/pp.105.061978</pubid><pubid idtype="pmcid">1203355</pubid><pubid idtype="pmpid" link="fulltext">16166258</pubid></pubidlist></xrefbib></bibl><bibl id="B34"><title><p>Contigs built with fingerprints, markers, and FPC V4.7.</p></title><aug><au><snm>Soderlund</snm><fnm>C</fnm></au><au><snm>Humphray</snm><fnm>S</fnm></au><au><snm>Dunham</snm><fnm>A</fnm></au><au><snm>French</snm><fnm>L</fnm></au></aug><source>Genome Res</source><pubdate>2000</pubdate><volume>10</volume><fpage>1772</fpage><lpage>1787</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1101/gr.GR-1375R</pubid><pubid idtype="pmcid">310962</pubid><pubid idtype="pmpid" link="fulltext">11076862</pubid></pubidlist></xrefbib></bibl><bibl id="B35"><title><p>PlantTribes: a gene and gene family resource for comparative genomics in plants.</p></title><aug><au><snm>Wall</snm><fnm>PK</fnm></au><au><snm>Leebens-Mack</snm><fnm>J</fnm></au><au><snm>Muller</snm><fnm>KF</fnm></au><au><snm>Field</snm><fnm>D</fnm></au><au><snm>Altman</snm><fnm>NS</fnm></au><au><snm>dePamphilis</snm><fnm>CW</fnm></au></aug><source>Nucleic Acids Res</source><pubdate>2008</pubdate><volume>36</volume><fpage>D970</fpage><lpage>976</lpage><xrefbib><pubidlist><pubid idtype="pmcid">2238917</pubid><pubid idtype="pmpid" link="fulltext">18073194</pubid></pubidlist></xrefbib></bibl><bibl id="B36"><title><p>Identification of shared single copy nuclear genes in <it>Arabidopsis</it>, Populus, Vitis and <it>Oryza </it>and their phylogenetic utility across various taxonomic levels.</p></title><aug><au><snm>Duarte</snm><fnm>JM</fnm></au><au><snm>Wall</snm><fnm>PK</fnm></au><au><snm>Edger</snm><fnm>PP</fnm></au><au><snm>Landherr</snm><fnm>LL</fnm></au><au><snm>Ma</snm><fnm>H</fnm></au><au><snm>Pires</snm><fnm>JC</fnm></au><au><snm>Leebens-Mack</snm><fnm>J</fnm></au><au><snm>dePamphilis</snm><fnm>CW</fnm></au></aug><source>BMC Evol Biol</source><pubdate>2010</pubdate><volume>10</volume><fpage>61</fpage><xrefbib><pubidlist><pubid idtype="doi">10.1186/1471-2148-10-61</pubid><pubid idtype="pmcid">2848037</pubid><pubid idtype="pmpid" link="fulltext">20181251</pubid></pubidlist></xrefbib></bibl><bibl id="B37"><title><p>Analysis of the <it>Amborella </it>trichopoda chloroplast genome sequence suggests that amborella is not a basal angiosperm.</p></title><aug><au><snm>Goremykin</snm><fnm>VV</fnm></au><au><snm>Hirsch-Ernst</snm><fnm>KI</fnm></au><au><snm>Wolfl</snm><fnm>S</fnm></au><au><snm>Hellwig</snm><fnm>FH</fnm></au></aug><source>Mol Biol Evol</source><pubdate>2003</pubdate><volume>20</volume><fpage>1499</fpage><lpage>1505</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/molbev/msg159</pubid><pubid idtype="pmpid" link="fulltext">12832641</pubid></pubidlist></xrefbib></bibl><bibl id="B38"><title><p>Repbase Update, a database of eukaryotic repetitive elements.</p></title><aug><au><snm>Jurka</snm><fnm>J</fnm></au><au><snm>Kapitonov</snm><fnm>VV</fnm></au><au><snm>Pavlicek</snm><fnm>A</fnm></au><au><snm>Klonowski</snm><fnm>P</fnm></au><au><snm>Kohany</snm><fnm>O</fnm></au><au><snm>Walichiewicz</snm><fnm>J</fnm></au></aug><source>Cytogenet Genome Res</source><pubdate>2005</pubdate><volume>110</volume><fpage>462</fpage><lpage>467</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1159/000084979</pubid><pubid idtype="pmpid" link="fulltext">16093699</pubid></pubidlist></xrefbib></bibl><bibl id="B39"><title><p>Basic local alignment search tool.</p></title><aug><au><snm>Altschul</snm><fnm>SF</fnm></au><au><snm>Gish</snm><fnm>W</fnm></au><au><snm>Miller</snm><fnm>W</fnm></au><au><snm>Myers</snm><fnm>EW</fnm></au><au><snm>Lipman</snm><fnm>DJ</fnm></au></aug><source>J Mol Biol</source><pubdate>1990</pubdate><volume>215</volume><fpage>403</fpage><lpage>410</lpage><xrefbib><pubid idtype="pmpid">2231712</pubid></xrefbib></bibl><bibl id="B40"><title><p>Identifying the basal angiosperm node in chloroplast genome phylogenies: sampling one's way out of the Felsenstein zone.</p></title><aug><au><snm>Leebens-Mack</snm><fnm>J</fnm></au><au><snm>Raubeson</snm><fnm>LA</fnm></au><au><snm>Cui</snm><fnm>L</fnm></au><au><snm>Kuehl</snm><fnm>JV</fnm></au><au><snm>Fourcade</snm><fnm>MH</fnm></au><au><snm>Chumley</snm><fnm>TW</fnm></au><au><snm>Boore</snm><fnm>JL</fnm></au><au><snm>Jansen</snm><fnm>RK</fnm></au><au><snm>dePamphilis</snm><fnm>CW</fnm></au></aug><source>Mol Biol Evol</source><pubdate>2005</pubdate><volume>22</volume><fpage>1948</fpage><lpage>1963</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/molbev/msi191</pubid><pubid idtype="pmpid" link="fulltext">15944438</pubid></pubidlist></xrefbib></bibl><bibl id="B41"><title><p>Using fossils to break long branches in molecular dating: a comparison of relaxed clocks applied to the origin of angiosperms.</p></title><aug><au><snm>Magallon</snm><fnm>S</fnm></au></aug><source>Syst Biol</source><pubdate>2010</pubdate><volume>59</volume><fpage>384</fpage><lpage>399</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/sysbio/syq027</pubid><pubid idtype="pmpid" link="fulltext">20538759</pubid></pubidlist></xrefbib></bibl><bibl id="B42"><title><p>An uncorrelated relaxed-clock analysis suggests an earlier origin for flowering plants.</p></title><aug><au><snm>Smith</snm><fnm>SA</fnm></au><au><snm>Beaulieu</snm><fnm>JM</fnm></au><au><snm>Donoghue</snm><fnm>MJ</fnm></au></aug><source>Proc Natl Acad Sci USA</source><pubdate>2010</pubdate><volume>107</volume><fpage>5897</fpage><lpage>5902</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1073/pnas.1001225107</pubid><pubid idtype="pmcid">2851901</pubid><pubid idtype="pmpid" link="fulltext">20304790</pubid></pubidlist></xrefbib></bibl><bibl id="B43"><title><p>Exceptional diversity, non-random distribution, and rapid evolution of retroelements in the B73 maize genome.</p></title><aug><au><snm>Baucom</snm><fnm>RS</fnm></au><au><snm>Estill</snm><fnm>JC</fnm></au><au><snm>Chaparro</snm><fnm>C</fnm></au><au><snm>Upshaw</snm><fnm>N</fnm></au><au><snm>Jogi</snm><fnm>A</fnm></au><au><snm>Deragon</snm><fnm>JM</fnm></au><au><snm>Westerman</snm><fnm>RP</fnm></au><au><snm>Sanmiguel</snm><fnm>PJ</fnm></au><au><snm>Bennetzen</snm><fnm>JL</fnm></au></aug><source>PLoS Genet</source><pubdate>2009</pubdate><volume>5</volume><fpage>e1000732</fpage><xrefbib><pubidlist><pubid idtype="doi">10.1371/journal.pgen.1000732</pubid><pubid idtype="pmcid">2774510</pubid><pubid idtype="pmpid" link="fulltext">19936065</pubid></pubidlist></xrefbib></bibl><bibl id="B44"><title><p>The map-based sequence of the rice genome.</p></title><aug><au><cnm>International Rice Genome Sequencing Project</cnm></au></aug><source>Nature</source><pubdate>2005</pubdate><volume>436</volume><fpage>793</fpage><lpage>800</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/nature03895</pubid><pubid idtype="pmpid" link="fulltext">16100779</pubid></pubidlist></xrefbib></bibl><bibl id="B45"><title><p>The grapevine genome sequence suggests ancestral hexaploidization in major angiosperm phyla.</p></title><aug><au><snm>Jaillon</snm><fnm>O</fnm></au><au><snm>Aury</snm><fnm>JM</fnm></au><au><snm>Noel</snm><fnm>B</fnm></au><au><snm>Policriti</snm><fnm>A</fnm></au><au><snm>Clepet</snm><fnm>C</fnm></au><au><snm>Casagrande</snm><fnm>A</fnm></au><au><snm>Choisne</snm><fnm>N</fnm></au><au><snm>Aubourg</snm><fnm>S</fnm></au><au><snm>Vitulo</snm><fnm>N</fnm></au><au><snm>Jubin</snm><fnm>C</fnm></au><au><snm>Vezzi</snm><fnm>A</fnm></au><au><snm>Legeai</snm><fnm>F</fnm></au><au><snm>Hugueney</snm><fnm>P</fnm></au><au><snm>Dasilva</snm><fnm>C</fnm></au><au><snm>Horner</snm><fnm>D</fnm></au><au><snm>Micac</snm><fnm>E</fnm></au><au><snm>Jublot</snm><fnm>D</fnm></au><au><snm>Poulain</snm><fnm>J</fnm></au><au><snm>Bruyere</snm><fnm>C</fnm></au><au><snm>Billault</snm><fnm>A</fnm></au><au><snm>Segurens</snm><fnm>B</fnm></au><au><snm>Gouyvenoux</snm><fnm>M</fnm></au><au><snm>Ugarte</snm><fnm>E</fnm></au><au><snm>Cattonaro</snm><fnm>F</fnm></au><au><snm>Anthouard</snm><fnm>V</fnm></au><au><snm>Vico</snm><fnm>V</fnm></au><au><snm>Del Fabbro</snm><fnm>C</fnm></au><au><snm>Alaux</snm><fnm>M</fnm></au><au><snm>Di Gaspero</snm><fnm>G</fnm></au><au><snm>Dumas</snm><fnm>V</fnm></au><etal/></aug><source>Nature</source><pubdate>2007</pubdate><volume>449</volume><fpage>463</fpage><lpage>467</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/nature06148</pubid><pubid idtype="pmpid" link="fulltext">17721507</pubid></pubidlist></xrefbib></bibl><bibl id="B46"><title><p>Genome sequence of the palaeopolyploid soybean.</p></title><aug><au><snm>Schmutz</snm><fnm>J</fnm></au><au><snm>Cannon</snm><fnm>SB</fnm></au><au><snm>Schlueter</snm><fnm>J</fnm></au><au><snm>Ma</snm><fnm>J</fnm></au><au><snm>Mitros</snm><fnm>T</fnm></au><au><snm>Nelson</snm><fnm>W</fnm></au><au><snm>Hyten</snm><fnm>DL</fnm></au><au><snm>Song</snm><fnm>Q</fnm></au><au><snm>Thelen</snm><fnm>JJ</fnm></au><au><snm>Cheng</snm><fnm>J</fnm></au><au><snm>D</snm><fnm>Xu</fnm></au><au><snm>Hellsten</snm><fnm>U</fnm></au><au><snm>May</snm><fnm>GD</fnm></au><au><snm>Yu</snm><fnm>Y</fnm></au><au><snm>Sakurai</snm><fnm>T</fnm></au><au><snm>Umezawa</snm><fnm>T</fnm></au><au><snm>Bhattacharyya</snm><fnm>MK</fnm></au><au><snm>Sandhu</snm><fnm>D</fnm></au><au><snm>Valliyodan</snm><fnm>B</fnm></au><au><snm>Lindquist</snm><fnm>E</fnm></au><au><snm>Peto</snm><fnm>M</fnm></au><au><snm>Grant</snm><fnm>D</fnm></au><au><snm>Shu</snm><fnm>S</fnm></au><au><snm>Goodstein</snm><fnm>D</fnm></au><au><snm>Barry</snm><fnm>K</fnm></au><au><snm>Futrell-Griggs</snm><fnm>M</fnm></au><au><snm>Abernathy</snm><fnm>B</fnm></au><au><snm>Du</snm><fnm>J</fnm></au><au><snm>Tian</snm><fnm>Z</fnm></au><au><snm>Zhu</snm><fnm>L</fnm></au><etal/></aug><source>Nature</source><pubdate>2010</pubdate><volume>463</volume><fpage>178</fpage><lpage>183</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/nature08670</pubid><pubid idtype="pmpid" link="fulltext">20075913</pubid></pubidlist></xrefbib></bibl><bibl id="B47"><title><p>LINEs and gypsy-like retrotransposons in Hordeum species.</p></title><aug><au><snm>Vershinin</snm><fnm>AV</fnm></au><au><snm>Druka</snm><fnm>A</fnm></au><au><snm>Alkhimova</snm><fnm>AG</fnm></au><au><snm>Kleinhofs</snm><fnm>A</fnm></au><au><snm>Heslop-Harrison</snm><fnm>JS</fnm></au></aug><source>Plant Mol Biol</source><pubdate>2002</pubdate><volume>49</volume><fpage>1</fpage><lpage>14</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1023/A:1014469830680</pubid><pubid idtype="pmpid" link="fulltext">12008894</pubid></pubidlist></xrefbib></bibl><bibl id="B48"><title><p>An abundant LINE-like element amplified in the genome of Lilium speciosum.</p></title><aug><au><snm>Leeton</snm><fnm>PR</fnm></au><au><snm>Smyth</snm><fnm>DR</fnm></au></aug><source>Mol Gen Genet</source><pubdate>1993</pubdate><volume>237</volume><fpage>97</fpage><lpage>104</lpage><xrefbib><pubid idtype="pmpid">7681139</pubid></xrefbib></bibl><bibl id="B49"><title><p>MUST: a system for identification of miniature inverted-repeat transposable elements and applications to <it>Anabaena variabilis </it>and <it>Haloquadratum walsbyi</it>.</p></title><aug><au><snm>Chen</snm><fnm>Y</fnm></au><au><snm>Zhou</snm><fnm>F</fnm></au><au><snm>Li</snm><fnm>G</fnm></au><au><snm>Xu</snm><fnm>Y</fnm></au></aug><source>Gene</source><pubdate>2009</pubdate><volume>436</volume><fpage>1</fpage><lpage>7</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1016/j.gene.2009.01.019</pubid><pubid idtype="pmpid" link="fulltext">19393167</pubid></pubidlist></xrefbib></bibl><bibl id="B50"><title><p>Differential lineage-specific amplification of transposable elements is responsible for genome size variation in <it>Gossypium</it>.</p></title><aug><au><snm>Hawkins</snm><fnm>JS</fnm></au><au><snm>Kim</snm><fnm>H</fnm></au><au><snm>Nason</snm><fnm>JD</fnm></au><au><snm>Wing</snm><fnm>RA</fnm></au><au><snm>Wendel</snm><fnm>JF</fnm></au></aug><source>Genome Res</source><pubdate>2006</pubdate><volume>16</volume><fpage>1252</fpage><lpage>1261</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1101/gr.5282906</pubid><pubid idtype="pmcid">1581434</pubid><pubid idtype="pmpid" link="fulltext">16954538</pubid></pubidlist></xrefbib></bibl><bibl id="B51"><title><p>LINEs, SINEs and repetitive DNA: non-LTR retrotransposons in plant genomes.</p></title><aug><au><snm>Schmidt</snm><fnm>T</fnm></au></aug><source>Plant Mol Biol</source><pubdate>1999</pubdate><volume>40</volume><fpage>903</fpage><lpage>910</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1023/A:1006212929794</pubid><pubid idtype="pmpid" link="fulltext">10527415</pubid></pubidlist></xrefbib></bibl><bibl id="B52"><title><p>A new method to compute K-mer frequencies and its application to annotate large repetitive plant genomes.</p></title><aug><au><snm>Kurtz</snm><fnm>S</fnm></au><au><snm>Narechania</snm><fnm>A</fnm></au><au><snm>Stein</snm><fnm>JC</fnm></au><au><snm>Ware</snm><fnm>D</fnm></au></aug><source>BMC Genomics</source><pubdate>2008</pubdate><volume>9</volume><fpage>517</fpage><xrefbib><pubidlist><pubid idtype="doi">10.1186/1471-2164-9-517</pubid><pubid idtype="pmcid">2613927</pubid><pubid idtype="pmpid" link="fulltext">18976482</pubid></pubidlist></xrefbib></bibl><bibl id="B53"><title><p>KEW C-Value Database.</p></title><url>http://data.kew.org/cvalues/</url></bibl><bibl id="B54"><title><p>Comparative physical mapping links conservation of microsynteny to chromosome structure and recombination in grasses.</p></title><aug><au><snm>Bowers</snm><fnm>JE</fnm></au><au><snm>Arias</snm><fnm>MA</fnm></au><au><snm>Asher</snm><fnm>R</fnm></au><au><snm>Avise</snm><fnm>JA</fnm></au><au><snm>Ball</snm><fnm>RT</fnm></au><au><snm>Brewer</snm><fnm>GA</fnm></au><au><snm>Buss</snm><fnm>RW</fnm></au><au><snm>Chen</snm><fnm>AH</fnm></au><au><snm>Edwards</snm><fnm>TM</fnm></au><au><snm>Estill</snm><fnm>JC</fnm></au><au><snm>Exum</snm><fnm>HE</fnm></au><au><snm>Goff</snm><fnm>VH</fnm></au><au><snm>Herrick</snm><fnm>KL</fnm></au><au><snm>Steele</snm><fnm>CL</fnm></au><au><snm>Karunakaran</snm><fnm>S</fnm></au><au><snm>Lafayette</snm><fnm>GK</fnm></au><au><snm>Lemke</snm><fnm>C</fnm></au><au><snm>Marler</snm><fnm>BS</fnm></au><au><snm>Masters</snm><fnm>SL</fnm></au><au><snm>McMillan</snm><fnm>JM</fnm></au><au><snm>Nelson</snm><fnm>LK</fnm></au><au><snm>Newsome</snm><fnm>GA</fnm></au><au><snm>Nwakanma</snm><fnm>CC</fnm></au><au><snm>Odeh</snm><fnm>RN</fnm></au><au><snm>Phelps</snm><fnm>CA</fnm></au><au><snm>Rarick</snm><fnm>EA</fnm></au><au><snm>Rogers</snm><fnm>CJ</fnm></au><au><snm>Ryan</snm><fnm>SP</fnm></au><au><snm>Slaughter</snm><fnm>KA</fnm></au><au><snm>Soderlund</snm><fnm>CA</fnm></au><etal/></aug><source>Proc Natl Acad Sci USA</source><pubdate>2005</pubdate><volume>102</volume><fpage>13206</fpage><lpage>13211</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1073/pnas.0502365102</pubid><pubid idtype="pmcid">1201573</pubid><pubid idtype="pmpid" link="fulltext">16141333</pubid></pubidlist></xrefbib></bibl><bibl id="B55"><title><p>The Sorghum bicolor genome and the diversification of grasses.</p></title><aug><au><snm>Paterson</snm><fnm>AH</fnm></au><au><snm>Bowers</snm><fnm>JE</fnm></au><au><snm>Bruggmann</snm><fnm>R</fnm></au><au><snm>Dubchak</snm><fnm>I</fnm></au><au><snm>Grimwood</snm><fnm>J</fnm></au><au><snm>Gundlach</snm><fnm>H</fnm></au><au><snm>Haberer</snm><fnm>G</fnm></au><au><snm>Hellsten</snm><fnm>U</fnm></au><au><snm>Mitros</snm><fnm>T</fnm></au><au><snm>Poliakov</snm><fnm>A</fnm></au><au><snm>Schmutz</snm><fnm>J</fnm></au><au><snm>Spannagl</snm><fnm>M</fnm></au><au><snm>Tang</snm><fnm>H</fnm></au><au><snm>Wang</snm><fnm>X</fnm></au><au><snm>Wicker</snm><fnm>T</fnm></au><au><snm>Bharti</snm><fnm>AK</fnm></au><au><snm>Chapman</snm><fnm>J</fnm></au><au><snm>Feltus</snm><fnm>FA</fnm></au><au><snm>Gowik</snm><fnm>U</fnm></au><au><snm>Grigoriev</snm><fnm>IV</fnm></au><au><snm>Lyons</snm><fnm>E</fnm></au><au><snm>Maher</snm><fnm>CA</fnm></au><au><snm>Martis</snm><fnm>M</fnm></au><au><snm>Narechania</snm><fnm>A</fnm></au><au><snm>Otillar</snm><fnm>RP</fnm></au><au><snm>Penning</snm><fnm>BW</fnm></au><au><snm>Salamov</snm><fnm>AA</fnm></au><au><snm>Wang</snm><fnm>Y</fnm></au><au><snm>Zhang</snm><fnm>L</fnm></au><au><snm>Carpita</snm><fnm>NC</fnm></au><etal/></aug><source>Nature</source><pubdate>2009</pubdate><volume>457</volume><fpage>551</fpage><lpage>556</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/nature07723</pubid><pubid idtype="pmpid" link="fulltext">19189423</pubid></pubidlist></xrefbib></bibl><bibl id="B56"><title><p>The B73 maize genome: complexity, diversity, and dynamics.</p></title><aug><au><snm>Schnable</snm><fnm>PS</fnm></au><au><snm>Ware</snm><fnm>D</fnm></au><au><snm>Fulton</snm><fnm>RS</fnm></au><au><snm>Stein</snm><fnm>JC</fnm></au><au><snm>Wei</snm><fnm>F</fnm></au><au><snm>Pasternak</snm><fnm>S</fnm></au><au><snm>Liang</snm><fnm>C</fnm></au><au><snm>Zhang</snm><fnm>J</fnm></au><au><snm>Fulton</snm><fnm>L</fnm></au><au><snm>Graves</snm><fnm>TA</fnm></au><au><snm>Minx</snm><fnm>P</fnm></au><au><snm>Reily</snm><fnm>AD</fnm></au><au><snm>Courtney</snm><fnm>L</fnm></au><au><snm>Kruchowski</snm><fnm>SS</fnm></au><au><snm>Tomlinson</snm><fnm>C</fnm></au><au><snm>Strong</snm><fnm>C</fnm></au><au><snm>Delehaunty</snm><fnm>K</fnm></au><au><snm>Fronick</snm><fnm>C</fnm></au><au><snm>Courtney</snm><fnm>B</fnm></au><au><snm>Rock</snm><fnm>SM</fnm></au><au><snm>Belter</snm><fnm>E</fnm></au><au><snm>Du</snm><fnm>F</fnm></au><au><snm>Kim</snm><fnm>K</fnm></au><au><snm>Abbott</snm><fnm>RM</fnm></au><au><snm>Cotton</snm><fnm>M</fnm></au><au><snm>Levy</snm><fnm>A</fnm></au><au><snm>Marchetto</snm><fnm>P</fnm></au><au><snm>Ochoa</snm><fnm>K</fnm></au><au><snm>Jackson</snm><fnm>SM</fnm></au><au><snm>Gillam</snm><fnm>B</fnm></au><etal/></aug><source>Science</source><pubdate>2009</pubdate><volume>326</volume><fpage>1112</fpage><lpage>1115</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1126/science.1178534</pubid><pubid idtype="pmpid" link="fulltext">19965430</pubid></pubidlist></xrefbib></bibl><bibl id="B57"><title><p>The age and diversification of angiosperms re-revisited.</p></title><aug><au><snm>Bell</snm><fnm>CD</fnm></au><au><snm>Soltis</snm><fnm>DE</fnm></au><au><snm>Soltis</snm><fnm>P</fnm></au></aug><source>Am J Bot</source><pubdate>2010</pubdate><volume>97</volume><fpage>1296</fpage><lpage>1303</lpage><xrefbib><pubidlist><pubid idtype="doi">10.3732/ajb.0900346</pubid><pubid idtype="pmpid">21616882</pubid></pubidlist></xrefbib></bibl><bibl id="B58"><title><p>Unravelling angiosperm genome evolution by phylogenetic analysis of chromosomal duplication events.</p></title><aug><au><snm>Bowers</snm><fnm>JE</fnm></au><au><snm>Chapman</snm><fnm>BA</fnm></au><au><snm>Rong</snm><fnm>J</fnm></au><au><snm>Paterson</snm><fnm>AH</fnm></au></aug><source>Nature</source><pubdate>2003</pubdate><volume>422</volume><fpage>433</fpage><lpage>438</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/nature01521</pubid><pubid idtype="pmpid" link="fulltext">12660784</pubid></pubidlist></xrefbib></bibl><bibl id="B59"><title><p>Ancient polyploidization predating divergence of the cereals, and its consequences for comparative genomics.</p></title><aug><au><snm>Paterson</snm><fnm>AH</fnm></au><au><snm>Bowers</snm><fnm>JE</fnm></au><au><snm>Chapman</snm><fnm>BA</fnm></au></aug><source>Proc Natl Acad Sci USA</source><pubdate>2004</pubdate><volume>101</volume><fpage>9903</fpage><lpage>9908</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1073/pnas.0307901101</pubid><pubid idtype="pmcid">470771</pubid><pubid idtype="pmpid" link="fulltext">15161969</pubid></pubidlist></xrefbib></bibl><bibl id="B60"><title><p>The genome of black cottonwood, <it>Populus trichocarpa </it>(Torr. &amp; Gray).</p></title><aug><au><snm>Tuskan</snm><fnm>GA</fnm></au><au><snm>Difazio</snm><fnm>S</fnm></au><au><snm>Jansson</snm><fnm>S</fnm></au><au><snm>Bohlmann</snm><fnm>J</fnm></au><au><snm>Grigoriev</snm><fnm>I</fnm></au><au><snm>Hellsten</snm><fnm>U</fnm></au><au><snm>Putnam</snm><fnm>N</fnm></au><au><snm>Ralph</snm><fnm>S</fnm></au><au><snm>Rombauts</snm><fnm>S</fnm></au><au><snm>Salamov</snm><mnm>Schein</mnm><fnm>AJ</fnm></au><au><snm>Sterck</snm><fnm>L</fnm></au><au><snm>Aerts</snm><fnm>A</fnm></au><au><snm>Bhalerao</snm><fnm>RR</fnm></au><au><snm>Bhalerao</snm><fnm>RP</fnm></au><au><snm>Blaudez</snm><fnm>D</fnm></au><au><snm>Boerjan</snm><fnm>W</fnm></au><au><snm>Brun</snm><fnm>A</fnm></au><au><snm>Brunner</snm><fnm>A</fnm></au><au><snm>Busov</snm><fnm>V</fnm></au><au><snm>Campbell</snm><fnm>M</fnm></au><au><snm>Carlson</snm><fnm>J</fnm></au><au><snm>Chalot</snm><fnm>M</fnm></au><au><snm>Chapman</snm><fnm>J</fnm></au><au><snm>Chen</snm><fnm>GL</fnm></au><au><snm>Cooper</snm><fnm>D</fnm></au><au><snm>Coutinho</snm><fnm>PM</fnm></au><au><snm>Couturier</snm><fnm>J</fnm></au><au><snm>Covert</snm><fnm>S</fnm></au><au><snm>Cronk</snm><fnm>Q</fnm></au><au><snm>Cunningham</snm><fnm>R</fnm></au><etal/></aug><source>Science</source><pubdate>2006</pubdate><volume>313</volume><fpage>1596</fpage><lpage>1604</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1126/science.1128691</pubid><pubid idtype="pmpid" link="fulltext">16973872</pubid></pubidlist></xrefbib></bibl><bibl id="B61"><title><p>The DAWGPAWS pipeline for the annotation of genes and transposable elements in plant genomes.</p></title><aug><au><snm>Estill</snm><fnm>JC</fnm></au><au><snm>Bennetzen</snm><fnm>JL</fnm></au></aug><source>Plant Methods</source><pubdate>2009</pubdate><volume>5</volume><fpage>8</fpage><xrefbib><pubidlist><pubid idtype="doi">10.1186/1746-4811-5-8</pubid><pubid idtype="pmcid">2705364</pubid><pubid idtype="pmpid" link="fulltext">19545381</pubid></pubidlist></xrefbib></bibl><bibl id="B62"><title><p>DAWGPAWS.</p></title><url>http://dawgpaws.sourceforge.net</url></bibl><bibl id="B63"><title><p>FGENESH.</p></title><url>http://softberry.com</url></bibl><bibl id="B64"><title><p>Gene prediction in eukaryotes with a generalized hidden Markov model that uses hints from external sources.</p></title><aug><au><snm>Stanke</snm><fnm>M</fnm></au><au><snm>Schoffmann</snm><fnm>O</fnm></au><au><snm>Morgenstern</snm><fnm>B</fnm></au><au><snm>Waack</snm><fnm>S</fnm></au></aug><source>BMC Bioinformatics</source><pubdate>2006</pubdate><volume>7</volume><fpage>62</fpage><xrefbib><pubidlist><pubid idtype="doi">10.1186/1471-2105-7-62</pubid><pubid idtype="pmcid">1409804</pubid><pubid idtype="pmpid" link="fulltext">16469098</pubid></pubidlist></xrefbib></bibl><bibl id="B65"><title><p>Gene finding in novel genomes.</p></title><aug><au><snm>Korf</snm><fnm>I</fnm></au></aug><source>BMC Bioinformatics</source><pubdate>2004</pubdate><volume>5</volume><fpage>59</fpage><xrefbib><pubidlist><pubid idtype="doi">10.1186/1471-2105-5-59</pubid><pubid idtype="pmcid">421630</pubid><pubid idtype="pmpid" link="fulltext">15144565</pubid></pubidlist></xrefbib></bibl><bibl id="B66"><title><p>Computational gene annotation in new genome assemblies using GeneID.</p></title><aug><au><snm>Blanco</snm><fnm>E</fnm></au><au><snm>Abril</snm><fnm>JF</fnm></au></aug><source>Methods Mol Biol</source><pubdate>2009</pubdate><volume>537</volume><fpage>243</fpage><lpage>261</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1007/978-1-59745-251-9_12</pubid><pubid idtype="pmpid" link="fulltext">19378148</pubid></pubidlist></xrefbib></bibl><bibl id="B67"><title><p>Prediction of complete gene structures in human genomic DNA.</p></title><aug><au><snm>Burge</snm><fnm>C</fnm></au><au><snm>Karlin</snm><fnm>S</fnm></au></aug><source>J Mol Biol</source><pubdate>1997</pubdate><volume>268</volume><fpage>78</fpage><lpage>94</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1006/jmbi.1997.0951</pubid><pubid idtype="pmpid" link="fulltext">9149143</pubid></pubidlist></xrefbib></bibl><bibl id="B68"><title><p>GMAP: a genomic mapping and alignment program for mRNA and EST sequences.</p></title><aug><au><snm>Wu</snm><fnm>TD</fnm></au><au><snm>Watanabe</snm><fnm>CK</fnm></au></aug><source>Bioinformatics</source><pubdate>2005</pubdate><volume>21</volume><fpage>1859</fpage><lpage>1875</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/bioinformatics/bti310</pubid><pubid idtype="pmpid" link="fulltext">15728110</pubid></pubidlist></xrefbib></bibl><bibl id="B69"><title><p>Improving the <it>Arabidopsis </it>genome annotation using maximal transcript alignment assemblies.</p></title><aug><au><snm>Haas</snm><fnm>BJ</fnm></au><au><snm>Delcher</snm><fnm>AL</fnm></au><au><snm>Mount</snm><fnm>SM</fnm></au><au><snm>Wortman</snm><fnm>JR</fnm></au><au><snm>Smith</snm><fnm>RK</fnm><suf>Jr</suf></au><au><snm>Hannick</snm><fnm>LI</fnm></au><au><snm>Maiti</snm><fnm>R</fnm></au><au><snm>Ronning</snm><fnm>CM</fnm></au><au><snm>Rusch</snm><fnm>DB</fnm></au><au><snm>Town</snm><fnm>CD</fnm></au><au><snm>Salzberg</snm><fnm>SL</fnm></au><au><snm>White</snm><fnm>O</fnm></au></aug><source>Nucleic Acids Res</source><pubdate>2003</pubdate><volume>31</volume><fpage>5654</fpage><lpage>5666</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/nar/gkg770</pubid><pubid idtype="pmcid">206470</pubid><pubid idtype="pmpid" link="fulltext">14500829</pubid></pubidlist></xrefbib></bibl><bibl id="B70"><title><p>The <it>Arabidopsis </it>Information Resource (TAIR): gene structure and function annotation.</p></title><aug><au><snm>Swarbreck</snm><fnm>D</fnm></au><au><snm>Wilks</snm><fnm>C</fnm></au><au><snm>Lamesch</snm><fnm>P</fnm></au><au><snm>Berardini</snm><fnm>TZ</fnm></au><au><snm>Garcia-Hernandez</snm><fnm>M</fnm></au><au><snm>Foerster</snm><fnm>H</fnm></au><au><snm>Li</snm><fnm>D</fnm></au><au><snm>Meyer</snm><fnm>T</fnm></au><au><snm>Muller</snm><fnm>R</fnm></au><au><snm>Ploetz</snm><fnm>L</fnm></au><au><snm>Radenbaugh</snm><fnm>A</fnm></au><au><snm>Singh</snm><fnm>S</fnm></au><au><snm>Swing</snm><fnm>V</fnm></au><au><snm>Tissier</snm><fnm>C</fnm></au><au><snm>Zhang</snm><fnm>P</fnm></au><au><snm>Huala</snm><fnm>E</fnm></au></aug><source>Nucleic Acids Res</source><pubdate>2008</pubdate><volume>36</volume><fpage>D1009</fpage><lpage>1014</lpage><xrefbib><pubidlist><pubid idtype="pmcid">2238962</pubid><pubid idtype="pmpid" link="fulltext">17986450</pubid></pubidlist></xrefbib></bibl><bibl id="B71"><title><p>Legume genome evolution viewed through the Medicago truncatula and Lotus japonicus genomes.</p></title><aug><au><snm>Cannon</snm><fnm>SB</fnm></au><au><snm>Sterck</snm><fnm>L</fnm></au><au><snm>Rombauts</snm><fnm>S</fnm></au><au><snm>Sato</snm><fnm>S</fnm></au><au><snm>Cheung</snm><fnm>F</fnm></au><au><snm>Gouzy</snm><fnm>J</fnm></au><au><snm>Wang</snm><fnm>X</fnm></au><au><snm>Mudge</snm><fnm>J</fnm></au><au><snm>Vasdewani</snm><fnm>J</fnm></au><au><snm>Schiex</snm><fnm>T</fnm></au><au><snm>Spannagl</snm><fnm>M</fnm></au><au><snm>Monaghan</snm><fnm>E</fnm></au><au><snm>Nicholson</snm><fnm>C</fnm></au><au><snm>Humphray</snm><fnm>SJ</fnm></au><au><snm>Schoof</snm><fnm>H</fnm></au><au><snm>Mayer</snm><fnm>KF</fnm></au><au><snm>Rogers</snm><fnm>J</fnm></au><au><snm>Quetier</snm><fnm>F</fnm></au><au><snm>Oldroyd</snm><fnm>GE</fnm></au><au><snm>Debelle</snm><fnm>F</fnm></au><au><snm>Cook</snm><fnm>DR</fnm></au><au><snm>Retzel</snm><fnm>EF</fnm></au><au><snm>Roe</snm><fnm>BA</fnm></au><au><snm>Town</snm><fnm>CD</fnm></au><au><snm>Tabata</snm><fnm>S</fnm></au><au><snm>Van de Peer</snm><fnm>Y</fnm></au><au><snm>Young</snm><fnm>ND</fnm></au></aug><source>Proc Natl Acad Sci USA</source><pubdate>2006</pubdate><volume>103</volume><fpage>14959</fpage><lpage>14964</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1073/pnas.0603228103</pubid><pubid idtype="pmcid">1578499</pubid><pubid idtype="pmpid" link="fulltext">17003129</pubid></pubidlist></xrefbib></bibl><bibl id="B72"><title><p>Curated genome annotation of <it>Oryza sativa </it>ssp. japonica and comparative genome analysis with <it>Arabidopsis thaliana</it>.</p></title><aug><au><snm>Itoh</snm><fnm>T</fnm></au><au><snm>Tanaka</snm><fnm>T</fnm></au><au><snm>Barrero</snm><fnm>RA</fnm></au><au><snm>Yamasaki</snm><fnm>C</fnm></au><au><snm>Fujii</snm><fnm>Y</fnm></au><au><snm>Hilton</snm><fnm>PB</fnm></au><au><snm>Antonio</snm><fnm>BA</fnm></au><au><snm>Aono</snm><fnm>H</fnm></au><au><snm>Apweiler</snm><fnm>R</fnm></au><au><snm>Bruskiewich</snm><fnm>R</fnm></au><au><snm>Bureau</snm><fnm>T</fnm></au><au><snm>Burr</snm><fnm>F</fnm></au><au><snm>Costa de Oliveira</snm><fnm>A</fnm></au><au><snm>Fuks</snm><fnm>G</fnm></au><au><snm>Habara</snm><fnm>T</fnm></au><au><snm>Haberer</snm><fnm>G</fnm></au><au><snm>Han</snm><fnm>B</fnm></au><au><snm>Harada</snm><fnm>E</fnm></au><au><snm>Hiraki</snm><fnm>AT</fnm></au><au><snm>Hirochika</snm><fnm>H</fnm></au><au><snm>Hoen</snm><fnm>D</fnm></au><au><snm>Hokari</snm><fnm>H</fnm></au><au><snm>Hosokawa</snm><fnm>S</fnm></au><au><snm>Hsing</snm><fnm>YI</fnm></au><au><snm>Ikawa</snm><fnm>H</fnm></au><au><snm>Ikeo</snm><fnm>K</fnm></au><au><snm>Imanishi</snm><fnm>T</fnm></au><au><snm>Ito</snm><fnm>Y</fnm></au><au><snm>Jaiswal</snm><fnm>P</fnm></au><au><snm>Kanno</snm><fnm>M</fnm></au><etal/></aug><source>Genome Res</source><pubdate>2007</pubdate><volume>17</volume><fpage>175</fpage><lpage>183</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1101/gr.5509507</pubid><pubid idtype="pmcid">1781349</pubid><pubid idtype="pmpid" link="fulltext">17210932</pubid></pubidlist></xrefbib></bibl><bibl id="B73"><title><p>The map-based sequence of the rice genome.</p></title><aug><au><snm>Project</snm><fnm>IRGS</fnm></au></aug><source>Nature</source><pubdate>2005</pubdate><volume>436</volume><fpage>793</fpage><lpage>800</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/nature03895</pubid><pubid idtype="pmpid" link="fulltext">16100779</pubid></pubidlist></xrefbib></bibl><bibl id="B74"><title><p>Improved pairwise alignment of genomic DNA.</p></title><aug><au><snm>Harris</snm><fnm>RS</fnm></au></aug><source>PhD Thesis</source><publisher>Pennsylvania State University, Biology Department</publisher><pubdate>2007</pubdate></bibl><bibl id="B75"><title><p>Miller Lab Software.</p></title><url>http://www.bx.psu.edu/miller_lab/</url></bibl><bibl id="B76"><title><p>OrthoMCL: identification of ortholog groups for eukaryotic genomes.</p></title><aug><au><snm>Li</snm><fnm>L</fnm></au><au><snm>Stoeckert</snm><fnm>CJ</fnm><suf>Jr</suf></au><au><snm>Roos</snm><fnm>DS</fnm></au></aug><source>Genome Res</source><pubdate>2003</pubdate><volume>13</volume><fpage>2178</fpage><lpage>2189</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1101/gr.1224503</pubid><pubid idtype="pmcid">403725</pubid><pubid idtype="pmpid" link="fulltext">12952885</pubid></pubidlist></xrefbib></bibl><bibl id="B77"><title><p>PlantGDB: a resource for comparative plant genomics.</p></title><aug><au><snm>Duvick</snm><fnm>J</fnm></au><au><snm>Fu</snm><fnm>A</fnm></au><au><snm>Muppirala</snm><fnm>U</fnm></au><au><snm>Sabharwal</snm><fnm>M</fnm></au><au><snm>Wilkerson</snm><fnm>MD</fnm></au><au><snm>Lawrence</snm><fnm>CJ</fnm></au><au><snm>Lushbough</snm><fnm>C</fnm></au><au><snm>Brendel</snm><fnm>V</fnm></au></aug><source>Nucleic Acids Res</source><pubdate>2008</pubdate><volume>36</volume><fpage>D959</fpage><lpage>965</lpage><xrefbib><pubidlist><pubid idtype="pmcid">2238959</pubid><pubid idtype="pmpid" link="fulltext">18063570</pubid></pubidlist></xrefbib></bibl><bibl id="B78"><title><p>PlantGDB.</p></title><url>http://www.plantgdb.org/</url></bibl><bibl id="B79"><title><p>MUSCLE: a multiple sequence alignment method with reduced time and space complexity.</p></title><aug><au><snm>Edgar</snm><fnm>RC</fnm></au></aug><source>BMC Bioinformatics</source><pubdate>2004</pubdate><volume>5</volume><fpage>113</fpage><xrefbib><pubidlist><pubid idtype="doi">10.1186/1471-2105-5-113</pubid><pubid idtype="pmcid">517706</pubid><pubid idtype="pmpid" link="fulltext">15318951</pubid></pubidlist></xrefbib></bibl><bibl id="B80"><title><p>RAxML-VI-HPC: maximum likelihood-based phylogenetic analyses with thousands of taxa and mixed models.</p></title><aug><au><snm>Stamatakis</snm><fnm>A</fnm></au></aug><source>Bioinformatics</source><pubdate>2006</pubdate><volume>22</volume><fpage>2688</fpage><lpage>2690</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/bioinformatics/btl446</pubid><pubid idtype="pmpid" link="fulltext">16928733</pubid></pubidlist></xrefbib></bibl><bibl id="B81"><title><p>The draft genome of the transgenic tropical fruit tree papaya (Carica papaya Linnaeus).</p></title><aug><au><snm>Ming</snm><fnm>R</fnm></au><au><snm>Hou</snm><fnm>S</fnm></au><au><snm>Feng</snm><fnm>Y</fnm></au><au><snm>Yu</snm><fnm>Q</fnm></au><au><snm>Dionne-Laporte</snm><fnm>A</fnm></au><au><snm>Saw</snm><fnm>JH</fnm></au><au><snm>Senin</snm><fnm>P</fnm></au><au><snm>Wang</snm><fnm>W</fnm></au><au><snm>Ly</snm><fnm>BV</fnm></au><au><snm>Lewis</snm><fnm>KL</fnm></au><au><snm>Salzberg</snm><fnm>SL</fnm></au><au><snm>Feng</snm><fnm>L</fnm></au><au><snm>Jones</snm><fnm>MR</fnm></au><au><snm>Skelton</snm><fnm>RL</fnm></au><au><snm>Murray</snm><fnm>JE</fnm></au><au><snm>Chen</snm><fnm>C</fnm></au><au><snm>Qian</snm><fnm>W</fnm></au><au><snm>Shen</snm><fnm>J</fnm></au><au><snm>Du</snm><fnm>P</fnm></au><au><snm>Eustice</snm><fnm>M</fnm></au><au><snm>Tong</snm><fnm>E</fnm></au><au><snm>Tang</snm><fnm>H</fnm></au><au><snm>Lyons</snm><fnm>E</fnm></au><au><snm>Paull</snm><fnm>RE</fnm></au><au><snm>Michael</snm><fnm>TP</fnm></au><au><snm>Wall</snm><fnm>K</fnm></au><au><snm>Rice</snm><fnm>DW</fnm></au><au><snm>Albert</snm><fnm>H</fnm></au><au><snm>Wang</snm><fnm>ML</fnm></au><au><snm>Zhu</snm><fnm>YJ</fnm></au><etal/></aug><source>Nature</source><pubdate>2008</pubdate><volume>452</volume><fpage>991</fpage><lpage>996</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/nature06856</pubid><pubid idtype="pmcid">2836516</pubid><pubid idtype="pmpid" link="fulltext">18432245</pubid></pubidlist></xrefbib></bibl><bibl id="B82"><title><p>An improved method for plant BAC library construction.</p></title><aug><au><snm>Luo</snm><fnm>M</fnm></au><au><snm>Wing</snm><fnm>RA</fnm></au></aug><source>Methods Mol Biol</source><pubdate>2003</pubdate><volume>236</volume><fpage>3</fpage><lpage>20</lpage><xrefbib><pubid idtype="pmpid">14501055</pubid></xrefbib></bibl><bibl id="B83"><title><p>Comparative physical mapping between <it>Oryza sativa </it>(AA genome type) and <it>O. punctata </it>(BB genome type).</p></title><aug><au><snm>Kim</snm><fnm>H</fnm></au><au><snm>San Miguel</snm><fnm>P</fnm></au><au><snm>Nelson</snm><fnm>W</fnm></au><au><snm>Collura</snm><fnm>K</fnm></au><au><snm>Wissotski</snm><fnm>M</fnm></au><au><snm>Walling</snm><fnm>JG</fnm></au><au><snm>Kim</snm><fnm>JP</fnm></au><au><snm>Jackson</snm><fnm>SA</fnm></au><au><snm>Soderlund</snm><fnm>C</fnm></au><au><snm>Wing</snm><fnm>RA</fnm></au></aug><source>Genetics</source><pubdate>2007</pubdate><volume>176</volume><fpage>379</fpage><lpage>390</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1534/genetics.106.068783</pubid><pubid idtype="pmcid">1893071</pubid><pubid idtype="pmpid" link="fulltext">17339227</pubid></pubidlist></xrefbib></bibl><bibl id="B84"><title><p>The <it>Oryza </it>bacterial artificial chromosome library resource: construction and analysis of 12 deep-coverage large-insert BAC libraries that represent the 10 genome types of the genus <it>Oryza</it>.</p></title><aug><au><snm>Ammiraju</snm><fnm>JS</fnm></au><au><snm>Luo</snm><fnm>M</fnm></au><au><snm>Goicoechea</snm><fnm>JL</fnm></au><au><snm>Wang</snm><fnm>W</fnm></au><au><snm>Kudrna</snm><fnm>D</fnm></au><au><snm>Mueller</snm><fnm>C</fnm></au><au><snm>Talag</snm><fnm>J</fnm></au><au><snm>Kim</snm><fnm>H</fnm></au><au><snm>Sisneros</snm><fnm>NB</fnm></au><au><snm>Blackmon</snm><fnm>B</fnm></au><au><snm>Fang</snm><fnm>E</fnm></au><au><snm>Tomkins</snm><fnm>JB</fnm></au><au><snm>Brar</snm><fnm>D</fnm></au><au><snm>MacKill</snm><fnm>D</fnm></au><au><snm>McCouch</snm><fnm></fnm></au><au><snm>Kurata</snm><fnm>N</fnm></au><au><snm>Lambert</snm><fnm>G</fnm></au><au><snm>Galbraith</snm><fnm>DW</fnm></au><au><snm>Arumuganathan</snm><fnm>K</fnm></au><au><snm>K</snm><fnm>Rao</fnm></au><au><snm>Walling</snm><fnm>SJ</fnm></au><au><snm>Gill</snm><fnm>N</fnm></au><au><snm>Yu</snm><fnm>Y</fnm></au><au><snm>SanMiguel</snm><fnm>P</fnm></au><au><snm>Soderlund</snm><fnm>C</fnm></au><au><snm>Jackson</snm><fnm>S</fnm></au><au><snm>Wing</snm><fnm>RA</fnm></au></aug><source>Genome Res</source><pubdate>2006</pubdate><volume>16</volume><fpage>140</fpage><lpage>147</lpage><xrefbib><pubidlist><pubid idtype="pmcid">1356138</pubid><pubid idtype="pmpid" link="fulltext">16344555</pubid></pubidlist></xrefbib></bibl><bibl id="B85"><title><p>Base-calling of automated sequencer traces using phred. I. Accuracy assessment.</p></title><aug><au><snm>Ewing</snm><fnm>B</fnm></au><au><snm>Hillier</snm><fnm>L</fnm></au><au><snm>Wendl</snm><fnm>MC</fnm></au><au><snm>Green</snm><fnm>P</fnm></au></aug><source>Genome Res</source><pubdate>1998</pubdate><volume>8</volume><fpage>175</fpage><lpage>185</lpage><xrefbib><pubid idtype="pmpid" link="fulltext">9521921</pubid></xrefbib></bibl><bibl id="B86"><title><p>DNA sequence quality trimming and vector removal.</p></title><aug><au><snm>Chou</snm><fnm>HH</fnm></au><au><snm>Holmes</snm><fnm>MH</fnm></au></aug><source>Bioinformatics</source><pubdate>2001</pubdate><volume>17</volume><fpage>1093</fpage><lpage>1104</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/bioinformatics/17.12.1093</pubid><pubid idtype="pmpid" link="fulltext">11751217</pubid></pubidlist></xrefbib></bibl><bibl id="B87"><title><p>Transposable element distribution, abundance and role in genome size variation in the genus <it>Oryza</it>.</p></title><aug><au><snm>Zuccolo</snm><fnm>A</fnm></au><au><snm>Sebastian</snm><fnm>A</fnm></au><au><snm>Talag</snm><fnm>J</fnm></au><au><snm>Yu</snm><fnm>Y</fnm></au><au><snm>Kim</snm><fnm>H</fnm></au><au><snm>Collura</snm><fnm>K</fnm></au><au><snm>Kudrna</snm><fnm>D</fnm></au><au><snm>Wing</snm><fnm>RA</fnm></au></aug><source>BMC Evol Biol</source><pubdate>2007</pubdate><volume>7</volume><fpage>152</fpage><xrefbib><pubidlist><pubid idtype="doi">10.1186/1471-2148-7-152</pubid><pubid idtype="pmcid">2041954</pubid><pubid idtype="pmpid" link="fulltext">17727727</pubid></pubidlist></xrefbib></bibl><bibl id="B88"><title><p>SeqClean.</p></title><url>http://sourceforge.net/projects/seqclean/</url></bibl><bibl id="B89"><title><p>Using the miraEST assembler for reliable and automated mRNA transcript assembly and SNP detection in sequenced ESTs.</p></title><aug><au><snm>Chevreux</snm><fnm>B</fnm></au><au><snm>Pfisterer</snm><fnm>T</fnm></au><au><snm>Drescher</snm><fnm>B</fnm></au><au><snm>Driesel</snm><fnm>AJ</fnm></au><au><snm>Muller</snm><fnm>WE</fnm></au><au><snm>Wetter</snm><fnm>T</fnm></au><au><snm>Suhai</snm><fnm>S</fnm></au></aug><source>Genome Res</source><pubdate>2004</pubdate><volume>14</volume><fpage>1147</fpage><lpage>1159</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1101/gr.1917404</pubid><pubid idtype="pmcid">419793</pubid><pubid idtype="pmpid" link="fulltext">15140833</pubid></pubidlist></xrefbib></bibl><bibl id="B90"><title><p>A dot-matrix program with dynamic threshold control suited for genomic DNA and protein sequence analysis.</p></title><aug><au><snm>Sonnhammer</snm><fnm>EL</fnm></au><au><snm>Durbin</snm><fnm>R</fnm></au></aug><source>Gene</source><pubdate>1995</pubdate><volume>167</volume><fpage>GC1</fpage><lpage>10</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1016/0378-1119(95)00714-8</pubid><pubid idtype="pmpid">8566757</pubid></pubidlist></xrefbib></bibl><bibl id="B91"><title><p>Sputnik.</p></title><url>http://espressosoftware.com/sputnik/index.html</url></bibl><bibl id="B92"><title><p>Microsatellites are preferentially associated with nonrepetitive DNA in plant genomes.</p></title><aug><au><snm>Morgante</snm><fnm>M</fnm></au><au><snm>Hanafey</snm><fnm>M</fnm></au><au><snm>Powell</snm><fnm>W</fnm></au></aug><source>Nat Genet</source><pubdate>2002</pubdate><volume>30</volume><fpage>194</fpage><lpage>200</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/ng822</pubid><pubid idtype="pmpid" link="fulltext">11799393</pubid></pubidlist></xrefbib></bibl><bibl id="B93"><title><p>Integration of genetic, physical, and cytogenetic maps for Brassica rapa chromosome A7.</p></title><aug><au><snm>Xiong</snm><fnm>Z</fnm></au><au><snm>Kim</snm><fnm>JS</fnm></au><au><snm>Pires</snm><fnm>JC</fnm></au></aug><source>Cytogenet Genome Res</source><pubdate>2010</pubdate><volume>129</volume><fpage>190</fpage><lpage>198</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1159/000314640</pubid><pubid idtype="pmpid" link="fulltext">20628251</pubid></pubidlist></xrefbib></bibl><bibl id="B94"><title><p>Apollo: a community resource for genome annotation editing.</p></title><aug><au><snm>Lee</snm><fnm>E</fnm></au><au><snm>Harris</snm><fnm>N</fnm></au><au><snm>Gibson</snm><fnm>M</fnm></au><au><snm>Chetty</snm><fnm>R</fnm></au><au><snm>Lewis</snm><fnm>S</fnm></au></aug><source>Bioinformatics</source><pubdate>2009</pubdate><volume>25</volume><fpage>1836</fpage><lpage>1837</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/bioinformatics/btp314</pubid><pubid idtype="pmcid">2705230</pubid><pubid idtype="pmpid" link="fulltext">19439563</pubid></pubidlist></xrefbib></bibl><bibl id="B95"><title><p>The generic genome browser: a building block for a model organism system database.</p></title><aug><au><snm>Stein</snm><fnm>LD</fnm></au><au><snm>Mungall</snm><fnm>C</fnm></au><au><snm>Shu</snm><fnm>S</fnm></au><au><snm>Caudy</snm><fnm>M</fnm></au><au><snm>Mangone</snm><fnm>M</fnm></au><au><snm>Day</snm><fnm>A</fnm></au><au><snm>Nickerson</snm><fnm>E</fnm></au><au><snm>Stajich</snm><fnm>JE</fnm></au><au><snm>Harris</snm><fnm>TW</fnm></au><au><snm>Arva</snm><fnm>A</fnm></au><au><snm>Lewis</snm><fnm>S</fnm></au></aug><source>Genome Res</source><pubdate>2002</pubdate><volume>12</volume><fpage>1599</fpage><lpage>1610</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1101/gr.403602</pubid><pubid idtype="pmcid">187535</pubid><pubid idtype="pmpid" link="fulltext">12368253</pubid></pubidlist></xrefbib></bibl><bibl id="B96"><title><p>Rice Annotation Project.</p></title><url>http://rapdb.dna.affrc.go.jp/</url></bibl><bibl id="B97"><title><p>Grape Genome Browser.</p></title><url>http://www.genoscope.cns.fr/externe/GenomeBrowser/Vitis/</url></bibl></refgrp>
</bm></art>