<?xml version='1.0'?>
<!DOCTYPE art SYSTEM 'http://www.biomedcentral.com/xml/article.dtd'>
<art><ui>gb-2011-12-2-r20</ui><ji>GBJ</ji><fm>
<dochead>Research</dochead>
<bibl>
<title>
<p>Comparative genomics of the social amoebae <it>Dictyostelium discoideum </it>and <it>Dictyostelium purpureum</it>
</p>
</title>
<aug>
<au id="A1" ce="yes"><snm>Sucgang</snm><fnm>Richard</fnm><insr iid="I1"/><email>rsucgang@bcm.edu</email></au>
<au id="A2" ce="yes"><snm>Kuo</snm><fnm>Alan</fnm><insr iid="I2"/><email>akuo@lbl.gov</email></au>
<au id="A3" ce="yes"><snm>Tian</snm><fnm>Xiangjun</fnm><insr iid="I3"/><email>akuspa@bcm.edu</email></au>
<au id="A4" ce="yes"><snm>Salerno</snm><fnm>William</fnm><insr iid="I1"/><email>akuspa@bcm.edu</email></au>
<au id="A5"><snm>Parikh</snm><fnm>Anup</fnm><insr iid="I4"/><email>akuspa@bcm.edu</email></au>
<au id="A6"><snm>Feasley</snm><mi>L</mi><fnm>Christa</fnm><insr iid="I5"/><email>akuspa@bcm.edu</email></au>
<au id="A7"><snm>Dalin</snm><fnm>Eileen</fnm><insr iid="I2"/><email>akuspa@bcm.edu</email></au>
<au id="A8"><snm>Tu</snm><fnm>Hank</fnm><insr iid="I2"/><email>akuspa@bcm.edu</email></au>
<au id="A9"><snm>Huang</snm><fnm>Eryong</fnm><insr iid="I4"/><email>akuspa@bcm.edu</email></au>
<au id="A10"><snm>Barry</snm><fnm>Kerrie</fnm><insr iid="I2"/><email>akuspa@bcm.edu</email></au>
<au id="A11"><snm>Lindquist</snm><fnm>Erika</fnm><insr iid="I2"/><email>akuspa@bcm.edu</email></au>
<au id="A12"><snm>Shapiro</snm><fnm>Harris</fnm><insr iid="I2"/><email>akuspa@bcm.edu</email></au>
<au id="A13"><snm>Bruce</snm><fnm>David</fnm><insr iid="I2"/><email>akuspa@bcm.edu</email></au>
<au id="A14"><snm>Schmutz</snm><fnm>Jeremy</fnm><insr iid="I2"/><email>akuspa@bcm.edu</email></au>
<au id="A15"><snm>Salamov</snm><fnm>Asaf</fnm><insr iid="I2"/><email>akuspa@bcm.edu</email></au>
<au id="A16"><snm>Fey</snm><fnm>Petra</fnm><insr iid="I6"/><email>akuspa@bcm.edu</email></au>
<au id="A17"><snm>Gaudet</snm><fnm>Pascale</fnm><insr iid="I6"/><email>akuspa@bcm.edu</email></au>
<au id="A18"><snm>Anjard</snm><fnm>Christophe</fnm><insr iid="I7"/><email>akuspa@bcm.edu</email></au>
<au id="A19"><snm>Babu</snm><fnm>M Madan</fnm><insr iid="I8"/><email>akuspa@bcm.edu</email></au>
<au id="A20"><snm>Basu</snm><fnm>Siddhartha</fnm><insr iid="I6"/><email>akuspa@bcm.edu</email></au>
<au id="A21"><snm>Bushmanova</snm><fnm>Yulia</fnm><insr iid="I6"/><email>akuspa@bcm.edu</email></au>
<au id="A22"><snm>van der Wel</snm><fnm>Hanke</fnm><insr iid="I5"/><email>akuspa@bcm.edu</email></au>
<au id="A23"><snm>Katoh-Kurasawa</snm><fnm>Mariko</fnm><insr iid="I4"/><email>akuspa@bcm.edu</email></au>
<au id="A24"><snm>Dinh</snm><fnm>Christopher</fnm><insr iid="I1"/><email>akuspa@bcm.edu</email></au>
<au id="A25"><snm>Coutinho</snm><mi>M</mi><fnm>Pedro</fnm><insr iid="I9"/><email>akuspa@bcm.edu</email></au>
<au id="A26"><snm>Saito</snm><fnm>Tamao</fnm><insr iid="I10"/><email>akuspa@bcm.edu</email></au>
<au id="A27"><snm>Elias</snm><fnm>Marek</fnm><insr iid="I11"/><email>akuspa@bcm.edu</email></au>
<au id="A28"><snm>Schaap</snm><fnm>Pauline</fnm><insr iid="I12"/><email>akuspa@bcm.edu</email></au>
<au id="A29"><snm>Kay</snm><mi>R</mi><fnm>Robert</fnm><insr iid="I8"/><email>akuspa@bcm.edu</email></au>
<au id="A30"><snm>Henrissat</snm><fnm>Bernard</fnm><insr iid="I9"/><email>akuspa@bcm.edu</email></au>
<au id="A31"><snm>Eichinger</snm><fnm>Ludwig</fnm><insr iid="I13"/><email>akuspa@bcm.edu</email></au>
<au id="A32"><snm>Rivero</snm><fnm>Francisco</fnm><insr iid="I14"/><email>akuspa@bcm.edu</email></au>
<au id="A33"><snm>Putnam</snm><mi>H</mi><fnm>Nicholas</fnm><insr iid="I3"/><email>akuspa@bcm.edu</email></au>
<au id="A34"><snm>West</snm><mi>M</mi><fnm>Christopher</fnm><insr iid="I5"/><email>akuspa@bcm.edu</email></au>
<au id="A35"><snm>Loomis</snm><mi>F</mi><fnm>William</fnm><insr iid="I7"/><email>akuspa@bcm.edu</email></au>
<au id="A36"><snm>Chisholm</snm><mi>L</mi><fnm>Rex</fnm><insr iid="I6"/><email>akuspa@bcm.edu</email></au>
<au id="A37"><snm>Shaulsky</snm><fnm>Gad</fnm><insr iid="I3"/><insr iid="I4"/><email>akuspa@bcm.edu</email></au>
<au id="A38"><snm>Strassmann</snm><mi>E</mi><fnm>Joan</fnm><insr iid="I3"/><email>akuspa@bcm.edu</email></au>
<au id="A39"><snm>Queller</snm><mi>C</mi><fnm>David</fnm><insr iid="I3"/><email>akuspa@bcm.edu</email></au>
<au ca="yes" id="A40"><snm>Kuspa</snm><fnm>Adam</fnm><insr iid="I1"/><insr iid="I3"/><insr iid="I4"/><email>akuspa@bcm.edu</email></au>
<au id="A41"><snm>Grigoriev</snm><mi>V</mi><fnm>Igor</fnm><insr iid="I2"/><email>akuspa@bcm.edu</email></au>
</aug>
<insg>
<ins id="I1"><p>Verna and Marrs McLean Department of Biochemistry and Molecular Biology, Baylor College of Medicine, One Baylor Plaza, Houston, TX 77030, USA</p></ins>
<ins id="I2"><p>US Department of Energy Joint Genome Institute, 2800 Mitchell Drive, Walnut Creek, CA 9458, USA</p></ins>
<ins id="I3"><p>Department of Ecology and Evolutionary Biology, Rice University, 6100 Main Street, Houston, TX 77005, USA</p></ins>
<ins id="I4"><p>Department of Molecular and Human Genetics, Baylor College of Medicine, One Baylor Plaza, Houston, TX 77030, USA</p></ins>
<ins id="I5"><p>Department of Biochemistry and Molecular Biology, Oklahoma Center for Medical Glycobiology, University of Oklahoma Health Sciences Center, 110 N. Lindsay, Oklahoma City, OK 73104, USA</p></ins>
<ins id="I6"><p>dictyBase, Center for Genetic Medicine, Northwestern University, 750 N. Lake Shore Drive, Chicago, IL 60611, USA</p></ins>
<ins id="I7"><p>Section of Cell and Developmental Biology, Division of Biology, University of California, 9500 Gilman Dr, San Diego, La Jolla, CA 92093, USA</p></ins>
<ins id="I8"><p>Laboratory of Molecular Biology, MRC Centre, Hills Road, Cambridge CB2 2QH, UK</p></ins>
<ins id="I9"><p>Architecture et Fonction des Macromol&#233;cules Biologiques, UMR6098, CNRS, Universities of Aix-Marseille I &amp; II, 13288 Marseille, France</p></ins>
<ins id="I10"><p>Department of Materials and Life Sciences, Sophia University 7-1 Kioi-Cho, Chiyoda-Ku, Tokyo 102-8554, Japan</p></ins>
<ins id="I11"><p>Departments of Botany and Parasitology, Faculty of Science, Charles University in Prague, Albertov 6, Prague 128 43, Czech Republic</p></ins>
<ins id="I12"><p>College of Life Sciences, University of Dundee, Dow Street, Dundee, DD15EH, UK</p></ins>
<ins id="I13"><p>Center for Molecular Medicine Cologne, University of Cologne, Joseph-Stelzmann-Str. 52, 50931 Cologne, Germany</p></ins>
<ins id="I14"><p>Centre for Biomedical Research, The Hull York Medical School and Department of Biological Sciences, University of Hull, Hull, HU6 7RX, UK</p></ins>
</insg>
<source>Genome Biology</source>
<issn>1465-6906</issn>
<pubdate>2011</pubdate>
<volume>12</volume>
<issue>2</issue>
<fpage>R20</fpage>
<url>http://genomebiology.com/2011/12/2/R20</url>
<xrefbib><pubidlist><pubid idtype="doi">10.1186/gb-2011-12-2-r20</pubid><pubid idtype="pmpid">21356102</pubid></pubidlist></xrefbib>
</bibl>
<history><rec><date><day>20</day><month>7</month><year>2010</year></date></rec><revrec><date><day>9</day><month>12</month><year>2010</year></date></revrec><acc><date><day>28</day><month>2</month><year>2011</year></date></acc><pub><date><day>28</day><month>2</month><year>2011</year></date></pub></history>
<cpyrt><year>2011</year><collab>Sucgang et al.; licensee BioMed Central Ltd.</collab><note>This is an open access article distributed under the terms of the Creative Commons Attribution License (<url>http://creativecommons.org/licenses/by/2.0</url>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</note></cpyrt>
<abs>
<sec>
<st>
<p>Abstract</p>
</st>
<sec>
<st>
<p>Background</p>
</st>
<p>The social amoebae (Dictyostelia) are a diverse group of Amoebozoa that achieve multicellularity by aggregation and undergo morphogenesis into fruiting bodies with terminally differentiated spores and stalk cells. There are four groups of dictyostelids, with the most derived being a group that contains the model species <it>Dictyostelium discoideum</it>.</p>
</sec>
<sec>
<st>
<p>Results</p>
</st>
<p>We have produced a draft genome sequence of another group dictyostelid, <it>Dictyostelium </it>
<it>purpureum</it>, and compare it to the <it>D. discoideum </it>genome. The assembly (8.41 &#215; coverage) comprises 799 scaffolds totaling 33.0 Mb, comparable to the <it>D. discoideum </it>genome size. Sequence comparisons suggest that these two dictyostelids shared a common ancestor approximately 400 million years ago. In spite of this divergence, most orthologs reside in small clusters of conserved synteny. Comparative analyses revealed a core set of orthologous genes that illuminate dictyostelid physiology, as well as differences in gene family content. Interesting patterns of gene conservation and divergence are also evident, suggesting function differences; some protein families, such as the histidine kinases, have undergone little functional change, whereas others, such as the polyketide synthases, have undergone extensive diversification. The abundant amino acid homopolymers encoded in both genomes are generally not found in homologous positions within proteins, so they are unlikely to derive from ancestral DNA triplet repeats. Genes involved in the social stage evolved more rapidly than others, consistent with either relaxed selection or accelerated evolution due to social conflict.</p>
</sec>
<sec>
<st>
<p>Conclusions</p>
</st>
<p>The findings from this new genome sequence and comparative analysis shed light on the biology and evolution of the Dictyostelia.</p>
</sec>
</sec>
</abs>
</fm><meta>
<classifications>
<classification id="300100010" subtype="man_spc_id" type="BMC">Genome studies</classification>
<classification id="30010008" subtype="man_spc_id" type="BMC">Evolution</classification>
</classifications>
</meta><bdy>
<sec>
<st>
<p>Background</p>
</st>
<p>The social amoebae have been used to study mechanisms of eukaryotic cell chemotaxis and cell differentiation for over 70 years. The completion of the <it>Dictyostelium discoideum </it>genome sequence provided a wealth of information about the basic cell and developmental biology of these organisms and highlighted an unexpected similarity between the cell motility and signaling systems of the social amoebae and the metazoa <abbrgrp>
<abbr bid="B1">1</abbr>
</abbrgrp>. For example, the <it>D. discoideum </it>genome encodes numerous G-protein coupled receptors (GPCRs) of the frizzled/smoothened, metabotropic glutamate, and secretin families that were previously thought to be specific to animals, suggesting that the GPCR gene families branched prior to the animal/fungal split. Numerous other examples, such as SH2 domain based phosphoprotein signaling, the full complement of ATP-binding cassette (ABC) transporter gene families, and the apparently complex actin cytoskeleton, served to strengthen the idea that amoeba and amoeboid animal cells are related in a more fundamental way than one might have guessed based on their gross physiological traits. We compared the <it>D. discoideum </it>genome with a second dictyostelid genome, that of <it>Dictyostelium purpureum</it>, in order to determine the set of genes they share, as well as their genomic differences that might illuminate variations in physiology within the social amoeba.</p>
<p>The Amoebozoa are closely related to the opisthokonts (animals and fungi) and include unicellular amoebae (for example, <it>Acanthamoeba castellani</it>), obligate parasitic amoeba (for example, <it>Entamoeba histolytica</it>), the true slime molds (for example, <it>Physarum polycephalum</it>) and the social amoebae, or Dictyostelia (often incorrectly referred to as 'slime molds'). In the 10 years since the monophyly of the Amoebozoa was proposed <abbrgrp>
<abbr bid="B2">2</abbr>
</abbrgrp>, genomic-scale analysis has confirmed the hypothesis <abbrgrp>
<abbr bid="B3">3</abbr>
</abbrgrp> and the phylogenetic relationships between the major amoeboid lineages have been clarified <abbrgrp>
<abbr bid="B4">4</abbr>
<abbr bid="B5">5</abbr>
<abbr bid="B6">6</abbr>
</abbrgrp>. A molecular phylogeny of the Dictyostelia has been constructed and suggests four major groups; the basal, group 1 parvisporids that produce small spores; the group 2 heterostelids; the group 3 rhizostelids; and the group 4 dictyostelids, which include <it>D. purpureum </it>and the well-studied <it>D. discoideum </it>
<abbrgrp>
<abbr bid="B7">7</abbr>
</abbrgrp>. The dictyostelid group contains the largest number of described species of social amoeba and all of them produce large fruiting bodies with single sori, containing oblong spores, held aloft on a single cellular stalk.</p>
<p>
<it>D. purpureum </it>differs from <it>D. discoideum </it>in a number of developmental and morphological ways <abbrgrp>
<abbr bid="B8">8</abbr>
</abbrgrp>. In particular, during the social stage, <it>D. discoideum </it>delays irreversible commitment by cells to sterile stalk tissue until slug migration is complete. <it>D. purpureum</it>, by contrast, forms a stalk of dead cells as the slug moves towards light, increasing its ability to cross gaps <abbrgrp>
<abbr bid="B9">9</abbr>
</abbrgrp>. In addition, <it>D. purpureum </it>makes taller fruiting bodies with smaller spores than <it>D. discoideum </it>
<abbrgrp>
<abbr bid="B7">7</abbr>
</abbrgrp>. <it>D. purpureum </it>fruiting bodies are purple with a triangular base formed from specialized stalk cells, whereas <it>D. discoideum </it>fruiting bodies are yellow and supported by a basal disc. <it>D. purpureum </it>also exhibits greater sorting into kin groups in the social stage than does <it>D. discoideum </it>
<abbrgrp>
<abbr bid="B10">10</abbr>
<abbr bid="B11">11</abbr>
</abbrgrp>.</p>
<p>The <it>D. discoideum </it>genome sequence was the first amoebozoan genome to become available, and the deduced gene list improved our understanding of the facultative multicellular lifestyle of the social amoeba <abbrgrp>
<abbr bid="B1">1</abbr>
<abbr bid="B12">12</abbr>
</abbrgrp>. Here we present our initial analysis of the <it>D. purpureum </it>genome and compare it to the <it>D. discoideum </it>genome. Since these two species represent the two major clades of the group 4 dictyostelids, a comparison of their genomes has revealed much of the genomic diversity and conservation within this group of social amoebae. Overall, the two genomes are similar in size and gene content, sharing at least 7,619 orthologous protein coding genes and many more paralogous genes. A global analysis of sequence divergence suggests that the genetic diversity of the dictyostelids is similar to that of the vertebrates, from the bony fishes to the mammals. Some large gene families are nearly completely conserved between these two dictyostelids, while others have markedly diverged. Our analyses highlight general characteristics that are conserved among the dictyostelids, as well as potential differences, linking the genomic potential with the physiology of these soil microbes.</p>
</sec>
<sec>
<st>
<p>Results and Discussion</p>
</st>
<sec>
<st>
<p>Structure and comparative genomics of the <it>D. purpureum </it>genome</p>
</st>
<sec>
<st>
<p>Genome assembly</p>
</st>
<p>The genome of <it>D. purpureum </it>strain DpAX1, an axenic derivative of QSDP1, was sequenced using a whole genome shotgun sequencing approach (see Materials and methods) and assembled into 1,213 contigs arranged into 799 scaffolds with 240 larger than 50 kb (Additional file <supplr sid="S1">1</supplr>). There were 12,410 genes predicted and annotated using the JGI annotation pipeline (see Materials and methods); these are available from the JGI Genome Portal <abbrgrp>
<abbr bid="B13">13</abbr>
</abbrgrp> and from dictyBase <abbrgrp>
<abbr bid="B14">14</abbr>
</abbrgrp>. Thirty-three percent of the genes were supported by at least one EST clone and 89% of genes displayed some similarity to a gene in the NCBI non-redundant gene databases (Additional file <supplr sid="S1">1</supplr>). The genome size, gene count and average gene structure are very similar to those of <it>D. discoideum </it>(Table <tblr tid="T1">1</tblr>). Moreover, a recent comparative transcriptome analysis of <it>D. purpureum </it>and <it>D. discoideum</it>, using 'RNA-sequence' (RNA-seq), provides evidence for the transcription of 7,619 genes encoding protein orthologs within these species, or approximately 61% of the predicted <it>D. purpureum </it>genes <abbrgrp>
<abbr bid="B15">15</abbr>
</abbrgrp>.</p>
<suppl id="S1">
<title>
<p>Additional file 1</p>
</title>
<text>
<p>
<b>Supplementary text, figures and tables</b>. Supplementary text, figures and tables that include many details of the genome annotation.</p>
</text>
<file name="gb-2011-12-2-r20-S1.DOC">
   <p>Click here for file</p>
</file>
</suppl>
<tbl id="T1"><title><p>Table 1</p></title><caption><p>Comparison between the predicted protein coding genes of <it>D. purpureu</it><it>m </it>and <it>D. discoideu</it><it>m</it></p></caption><tblbdy cols="3">
      <r>
         <c ca="left">
            <p>
               <b>Feature</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>
                  <it>D. purpureum</it>
               </b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>
                  <it>D. discoideum</it>
               </b>
               <sup>
                  <b>a</b>
               </sup>
            </p>
         </c>
      </r>
      <r>
         <c cspan="3">
            <hr/>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Genome size (Mb)</p>
         </c>
         <c ca="center">
            <p>33</p>
         </c>
         <c ca="center">
            <p>34</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Number of genes</p>
         </c>
         <c ca="center">
            <p>12,410</p>
         </c>
         <c ca="center">
            <p>13,541</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Gene density (kb per gene)</p>
         </c>
         <c ca="center">
            <p>2.66</p>
         </c>
         <c ca="center">
            <p>2.5</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Mean gene length (nucleotides)</p>
         </c>
         <c ca="center">
            <p>1,760</p>
         </c>
         <c ca="center">
            <p>1,756</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Intron per gene (spliced genes)</p>
         </c>
         <c ca="center">
            <p>1.51</p>
         </c>
         <c ca="center">
            <p>1.9</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Mean intron length (nucleotides)</p>
         </c>
         <c ca="center">
            <p>177</p>
         </c>
         <c ca="center">
            <p>146</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Mean protein length (amino acids)</p>
         </c>
         <c ca="center">
            <p>483</p>
         </c>
         <c ca="center">
            <p>518</p>
         </c>
      </r>
   </tblbdy><tblfn>
      <p><sup>a</sup>From <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>.</p>
   </tblfn></tbl>
</sec>
<sec>
<st>
<p>Repetitive elements and simple sequence repeats</p>
</st>
<p>The <it>D. purpureum </it>genome contains 1.1 Mb of transposons (3.4%), fewer than in D. discoideum. The largest families of transposons are Gypsy (approximately 400 kb, 35.8% of total transposons), Mariner (approximately 186 kb, 16.7%), MSAT1_Dpu (126 kb, 11.4%), and hAT (105 kb, 9.5%).</p>
<p>The previously sequenced <it>D. discoideum </it>genome showed an unusually high number, length, and density of simple sequence repeats, including triplet repeats that code for amino acid homopolymers <abbrgrp>
<abbr bid="B1">1</abbr>
</abbrgrp>. If unopposed by selection, simple sequence repeats can accumulate in genomes because of their high mutation rates and mutation to different repeat numbers that occur by misalignment and slippage during replication <abbrgrp>
<abbr bid="B16">16</abbr>
</abbrgrp>. They are often thought of as non-functional 'junk' DNA, though some are known to be functional <abbrgrp>
<abbr bid="B17">17</abbr>
</abbrgrp>, and the expansion of some triplet repeats in humans are known to cause disease when the number of repeats exceeds a particular threshold <abbrgrp>
<abbr bid="B18">18</abbr>
</abbrgrp>. Despite its considerable evolutionary distance from <it>D. discoideum </it>(see below), <it>D. purpureum </it>also has a considerable density of simple sequence repeats (Figure <figr fid="F1">1a</figr>). Simple sequence repeats comprise 4.4% of the <it>D. purpureum </it>genome, compared to 11% in <it>D. discoideum </it>
<abbrgrp>
<abbr bid="B1">1</abbr>
</abbrgrp>. There are fewer long repeats that exceed 100 bp in length; 54 in <it>D. purpureum </it>compared to 1,436 in <it>D. discoideum</it>. The lower proportion of simple repeats in the <it>D. purpureum </it>genome and their shorter length may be due to current status of the assembly relative to the <it>D. discoideum </it>genome, since these repeats are difficult to assemble. Dinucleotide repeats, often the most common repeat in other species, are comparatively rare in both dictyostelid genomes (Figure <figr fid="F1">1b</figr>) <abbrgrp>
<abbr bid="B1">1</abbr>
</abbrgrp>.</p>
<fig id="F1"><title><p>Figure 1</p></title><caption><p>Number of occurrences of simple sequence repeats in <it>D. purpureum </it>and <it>D. discoideum </it>genomes</p></caption><text>
   <p><b>Number of occurrences of simple sequence repeats in <it>D. purpureum </it>and <it>D. discoideum </it>genomes</b>. <b>(a,b) </b>The numbers of repeats were classified by the length of repeat tracts (a) and the length of repeat units (b). The <it>D. purpureum </it>genome (circles) has fewer and shorter microsatellites than the <it>D. discoideum </it>genome (triangles) in both coding regions (solid circles and triangles, and solid lines) and non-coding regions (open circles and triangles, and dashed lines). Not shown are three <it>D. discoideum </it>repeats above 250 nucleotides in (a). The minimum number of repeats of the unit motif was 10 repeats for mononucleotides, 7 repeats for dinucleotides, 5 repeats for trinucleotides, 4 repeats for tetranucleotides, 3 repeats for pentanucleotides and longer (6- to 20-nucleotide) motifs.</p>
</text><graphic file="gb-2011-12-2-r20-1"/></fig>
</sec>
<sec>
<st>
<p>Amino acid homopolymers</p>
</st>
<p>One of the most distinctive characteristics of the <it>D. discoideum </it>genome is the extreme abundance of amino acid homopolymers within coding sequences <abbrgrp>
<abbr bid="B1">1</abbr>
</abbrgrp>. As in <it>D. discoideum</it>, simple sequence repeats are common in <it>D. purpureum </it>coding sequences (Figure <figr fid="F1">1a</figr>), particularly those with repeat motifs of three nucleotides or multiples of three (Figure <figr fid="F1">1b</figr>). These types of repeats contribute to many amino acid homopolymers (Figure S1 in Additional file <supplr sid="S1">1</supplr>), including 2,645 that are longer than expected by chance (&gt;5 to &gt;9 residues, depending on the amino acid; Table S1 in Additional file <supplr sid="S1">1</supplr>). Though the abundance and density is lower than in <it>D. discoideum</it>, the relative abundance of different amino acids repeats in <it>D. purpureum </it>is very similar, with asparagine and glutamine repeats dominating, followed by serine and threonine (Figure <figr fid="F2">2a</figr>). The correlation between the two species in the densities of different amino acid repeats is 0.997 (Pearson's correlation coefficient, <it>P </it>&lt; 0.001), much higher than either species' correlation with <it>Saccharomyces cerevisiae </it>(0.516 for <it>D. discoideum</it>, and 0.486 for <it>D. purpureum</it>), or with <it>Drosophila melanogaster </it>(0.241 and 0.238). However, the correlations are also high for the densities of amino acid repeats with the A/T-rich protist <it>Plasmodium falciparum </it>(0.917 and 0.923), in agreement with a study showing that A/T content exerts a major influence on which amino acid repeats accumulate and persist within genomes <abbrgrp>
<abbr bid="B19">19</abbr>
</abbrgrp>.</p>
<fig id="F2"><title><p>Figure 2</p></title><caption><p>Densities of different homopolymer amino acid repeats in <it>D. purpureum </it>and <it>D. discoideum</it></p></caption><text>
   <p><b>Densities of different homopolymer amino acid repeats in <it>D. purpureum </it>and <it>D. discoideum</it></b>. <b>(a) </b>The density of each kind of amino acid repeat was calculated by summing the lengths of non-random repeats of that amino acid (Table S1 in Additional file <supplr sid="S1">1</supplr>) over protein sequences of all genes from <it>D. purpureum </it>and <it>D. discoideum</it>, dividing by the total length of coding sequence, and multiplying by 1,000. Letters indicate which amino acid each point represents. The Pearson's correlation coefficient between them is 0.997, <it>P </it>&lt; 0.001. <b>(b) </b>Mean (&#177; standard error) non-synonymous substitution rates (dNs) of genes with and without amino acid repeats. The non-synonymous substitution rates were calculated between orthologs (excluding repeat sequences) of <it>D. purpureum </it>and <it>D. discoideum</it>. Orthologs without amino acid repeats have significantly lower dN than orthologs with repeats in either <it>D. discoideum </it>and <it>D. purpureum </it>(Students <it>t</it>-test, both tests <it>P </it>&lt; 0.0001). Error bars show standard errors of the means.</p>
</text><graphic file="gb-2011-12-2-r20-2"/></fig>
<p>Codon usage within these amino acid homopolymers is quite similar to codon usage for the same amino acids outside of repeats, with a pattern quite similar to <it>D. discoideum </it>(Figure S2 in Additional file <supplr sid="S1">1</supplr>). Again, as in <it>D. discoideum</it>, many amino acid homopolymers contain a single codon, consistent with the relatively recent expansion of those triplet repeats. However, the codon diversity of <it>D. purpureum </it>amino acid repeats is significantly higher than it is for <it>D. discoideum </it>(Figure S3 in Additional file <supplr sid="S1">1</supplr>), consistent with the <it>D. discoideum </it>repeats being younger, with less time to accumulate changes from the original codon.</p>
<p>The potential function of most amino acid repeats is unknown, but the availability of the <it>D. purpureum </it>genome permits some new tests. If amino acid repeats are generally functionally important, they should tend to be conserved in their position within orthologous proteins. Sixty-four percent of the 2,645 <it>D. purpureum </it>amino acid repeats and 68% of the 11,243 <it>D. discoideum </it>repeats occur in genes that do not have homologs in the other species. Even in those with orthologs, only 19% of <it>D. purpureum </it>repeats and 5% of the <it>D. discoideum </it>repeats appeared to be homologous within global alignments of their respective proteins. The count of homologous repeats would be higher if we included matches where at least one falls below the threshold expectation for non-random homopolymers (for example, a match between 25 asparagines in <it>D. discoideum </it>and 8 in <it>D. purpureum </it>would be excluded as a chance event; <it>P </it>&gt; 0.01; Table S1 in Additional file <supplr sid="S1">1</supplr>). On the other hand, some could be fortuitous matches forced by a large number of repeated amino acids that are not truly homologous. Inspection of selected sequences shows at least some that appear to be convincing homologs, with strong identity on both sides of the repeat (Figure S4 in Additional file <supplr sid="S1">1</supplr>). Still, the apparent small fraction of homologous repeats suggests that the very similar patterns of amino acid homopolymer abundance and distribution do not come primarily from conserved ancestral repeats. Instead they may come from some shared physiological properties - perhaps distinctive DNA polymerases or repair enzymes or high AT-content - that generate similar patterns independently.</p>
<p>In addition to the lack of homology for amino acid homopolymers between <it>D. discoideum </it>and <it>D. purpureum</it>, several pieces of evidence suggest that these triplet repeats may be 'junk' that accumulates due to weak selection on proteins that are relatively unimportant for fitness. For genes that have homologs in the two species, those with amino acid repeats in either species have higher non-synonymous substitution rates in the non-repeat regions, as expected if genes with repeats are generally less subject to purifying selection (Figure <figr fid="F2">2b</figr>). Another indicator of the degree of selective constraint on a gene is its expression level, particularly in the single-celled, vegetative stage where the selective pressure is likely to be the greatest. If amino acid repeats accumulate in genes where selective constraints are low, we would predict that they will be more common in genes expressed in the social or developmental stages, as opposed to vegetative stages. Using the recent comparison of the transcriptional profiles of <it>D. discoideum </it>and <it>D. purpureum </it>development by RNA-seq analysis <abbrgrp>
<abbr bid="B15">15</abbr>
</abbrgrp>, this prediction is confirmed (Figure S5a,c in Additional file <supplr sid="S1">1</supplr>). Similarly, we would predict, looking only at RNA-seq reads from the vegetative stage, that genes coding for amino acid repeats would be less abundant and this is also confirmed (Figure S5b,d in Additional file <supplr sid="S1">1</supplr>). In sum, although a small number of repeats appear to be conserved over long periods of time, most appear to have arisen relatively recently in genes where selection against amino acid changes is weak.</p>
</sec>
<sec>
<st>
<p>Phylogeny of <it>D. purpureum</it>
</p>
</st>
<p>A phylogeny based on small subunit ribosomal RNA gene sequences places <it>D. purpureum </it>and <it>D. discoideum </it>into distinct clades within the most derived of the four groups of social amoebae, the group 4 dictyostelids <abbrgrp>
<abbr bid="B7">7</abbr>
</abbrgrp>. Thus, these two species should represent much of the diversity of the group. We constructed a global phylogeny of representative plant, animal, fungal and amoebal species, based on 389 orthologous gene clusters, in order to estimate the divergence of <it>D. purpureum </it>and <it>D. discoideum </it>relative to other eukaryotes (Figure <figr fid="F3">3</figr>). This analysis suggests that the group 4 dictyostelids span a comparable degree of protein sequence divergence as occurs among vertebrate species ranging from the bony fishes to the mammals. Recent comprehensive analyses of orthologous protein clusters from complete predicted proteomes suggests that the rates of protein evolution in the Amoebozoa are comparable to those of the plants and animals <abbrgrp>
<abbr bid="B20">20</abbr>
</abbrgrp>. If gene sequence evolution occurs at the same rate in the two groups, these two observations suggest that <it>D. purpureum </it>and <it>D. discoideum </it>shared a common ancestor approximately 400 million years ago.</p>
<fig id="F3"><title><p>Figure 3</p></title><caption><p>Phylogeny of the dictyostelids</p></caption><text>
   <p><b>Phylogeny of the dictyostelids</b>. Orthologs (389) defined by pairwise genome comparisons for reciprocal best hits using BLASTP from human <abbrgrp><abbr bid="B100">100</abbr></abbrgrp> versus each of <it>Oryzias latipes </it><abbrgrp><abbr bid="B100">100</abbr></abbrgrp>, <it>Gallus gallus </it><abbrgrp><abbr bid="B100">100</abbr></abbrgrp>, <it>Branchiostoma floridae </it><abbrgrp><abbr bid="B101">101</abbr></abbrgrp>, <it>Nematostella vectensis </it><abbrgrp><abbr bid="B28">28</abbr></abbrgrp>, <it>Neurospora crassa </it>(Broad release 7) <abbrgrp><abbr bid="B102">102</abbr></abbrgrp>, <it>Arabidopsis thaliana </it>(TAIR8) <abbrgrp><abbr bid="B103">103</abbr></abbrgrp>, <it>Chlamydomonas reinhardtii </it><abbrgrp><abbr bid="B104">104</abbr></abbrgrp>, <it>Dictyostelium discoideum </it><abbrgrp><abbr bid="B14">14</abbr></abbrgrp>, plus <it>D. discoideum </it>versus each of <it>D. purpureum</it>, and <it>Entamoeba histolytica </it><abbrgrp><abbr bid="B22">22</abbr></abbrgrp>. A concatenated alignment of the orthologs was analyzed with mrBayes 3.1.2 using the WAG model, I + Gamma for 100,000 generations, with the first 50% of sampled trees discarded. The resulting consensus tree was rooted at the midpoint of the branch connecting the green plants to the rest of the tree.</p>
</text><graphic file="gb-2011-12-2-r20-3"/></fig>
</sec>
<sec>
<st>
<p>Horizontal gene transfer</p>
</st>
<p>The initial description of the <it>D. discoideum </it>genome included 18 genes that were proposed to be horizontal gene transfer (HGT) events from bacterial species <abbrgrp>
<abbr bid="B1">1</abbr>
</abbrgrp>. After 5 years of refinement of the underlying genome sequence, 16 <it>D. discoideum </it>genes remain potential HGT events. They have not been recognized in the characterized plant, animal or fungal genomes, and each of them is phylogenetically embedded within a bacterial clade. In addition, the thymidylate synthase gene, <it>thyA</it>, has been confirmed as an HGT; it is present only in a minority of the described bacterial species and is structurally unrelated to the canonical eukaryotic thymidylate synthase <abbrgrp>
<abbr bid="B21">21</abbr>
</abbrgrp>. To narrow the time frame wherein the HGT events might have occurred, we searched the <it>D. purpureum </it>genome for orthologs to these genes. Each of the proposed <it>D. discoideum </it>HGT genes have an ortholog in the <it>D. purpureum </it>genome (Table <tblr tid="T2">2</tblr>). This suggests that all 16 of these potential HGT events occurred after the divergence of the Amoebozoa from the plants and animals, but prior to the radiation of the group 4 dictyostelids.</p>
<tbl id="T2"><title><p>Table 2</p></title><caption><p>Candidate horizontal gene transfers from Bacteria</p></caption><tblbdy cols="6">
      <r>
         <c ca="left">
            <p>
               <b>Pfam domain</b>
               <sup>
                  <b>a</b>
               </sup>
            </p>
         </c>
         <c ca="left">
            <p>
               <b>Function in bacteria</b>
               <sup>
                  <b>b</b>
               </sup>
            </p>
         </c>
         <c ca="left">
            <p>
               <b><it>D. discoideum </it>dictyBase ID</b>
               <sup>
                  <b>c</b>
               </sup>
            </p>
         </c>
         <c ca="left">
            <p>
               <b>Function in <it>D. discoideum</it></b>
               <sup>
                  <b>c</b>
               </sup>
            </p>
         </c>
         <c ca="left">
            <p>
               <b><it>D. purpureum </it>protein ID</b>
               <sup>
                  <b>d</b>
               </sup>
            </p>
         </c>
         <c ca="left">
            <p>
               <b><it>D. purpureum </it>dictyBase ID</b>
            </p>
         </c>
      </r>
      <r>
         <c cspan="6">
            <hr/>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Beta_elim_lyase</p>
         </c>
         <c ca="left">
            <p>Aromatic amino acid lyase</p>
         </c>
         <c ca="left">
            <p>DDB_G0281127</p>
         </c>
         <c ca="left">
            <p>Unknown</p>
         </c>
         <c ca="left">
            <p>154359</p>
         </c>
         <c ca="left">
            <p>DPU_G0057350</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>BioY</p>
         </c>
         <c ca="left">
            <p>Biotin metabolism</p>
         </c>
         <c ca="left">
            <p>DDB_G0292424</p>
         </c>
         <c ca="left">
            <p>Unknown</p>
         </c>
         <c ca="left">
            <p>79107</p>
         </c>
         <c ca="left">
            <p>DPU_G0053374</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Cna_B</p>
         </c>
         <c ca="left">
            <p>Unknown</p>
         </c>
         <c ca="left">
            <p>DDB_G0292696</p>
         </c>
         <c ca="left">
            <p><it>colA</it>, Colossin A slug protein</p>
         </c>
         <c ca="left">
            <p>96318</p>
         </c>
         <c ca="left">
            <p>DPU_G0069302</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Peroxidase</p>
         </c>
         <c ca="left">
            <p>Dyp_peroxidase</p>
         </c>
         <c ca="left">
            <p>DDB_G0273083</p>
         </c>
         <c ca="left">
            <p>Unknown</p>
         </c>
         <c ca="left">
            <p>35644</p>
         </c>
         <c ca="left">
            <p>DPU_G0056076</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Endotoxin_N</p>
         </c>
         <c ca="left">
            <p>Insecticidal crystal protein</p>
         </c>
         <c ca="left">
            <p>DDB_G0289249</p>
         </c>
         <c ca="left">
            <p>Unknown</p>
         </c>
         <c ca="left">
            <p>96621</p>
         </c>
         <c ca="left">
            <p>DPU_G0058298</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>IPT</p>
         </c>
         <c ca="left">
            <p>Isopentenyl transferase</p>
         </c>
         <c ca="left">
            <p>DDB_G0277215</p>
         </c>
         <c ca="left">
            <p>Discadenine production</p>
         </c>
         <c ca="left">
            <p>92712</p>
         </c>
         <c ca="left">
            <p>DPU_G0062048</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>IucA_IucC</p>
         </c>
         <c ca="left">
            <p>Siderophore synthesis</p>
         </c>
         <c ca="left">
            <p>DDB_G0294004</p>
         </c>
         <c ca="left">
            <p>Unknown</p>
         </c>
         <c ca="left">
            <p>No model<sup>e</sup></p>
         </c>
         <c ca="left">
            <p>No model<sup>e</sup></p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>OsmC</p>
         </c>
         <c ca="left">
            <p>Osmoregulation</p>
         </c>
         <c ca="left">
            <p>DDB_G0268884</p>
         </c>
         <c ca="left">
            <p>Unknown</p>
         </c>
         <c ca="left">
            <p>93234</p>
         </c>
         <c ca="left">
            <p>DPU_G0070822</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Peptidase S13</p>
         </c>
         <c ca="left">
            <p>Dipeptidase/&#946;-lactamase</p>
         </c>
         <c ca="left">
            <p>DDB_G0271902</p>
         </c>
         <c ca="left">
            <p>Penicillin-sensitive carboxypeptidase</p>
         </c>
         <c ca="left">
            <p>6688</p>
         </c>
         <c ca="left">
            <p>DPU_G0063426</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>PP_kinase</p>
         </c>
         <c ca="left">
            <p>Polyphosphate synthesis</p>
         </c>
         <c ca="left">
            <p>DDB_G0293524</p>
         </c>
         <c ca="left">
            <p>Polyphosphate synthesis</p>
         </c>
         <c ca="left">
            <p>45674</p>
         </c>
         <c ca="left">
            <p>DPU_G0062710</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>TerD</p>
         </c>
         <c ca="left">
            <p>Tellurium resistance</p>
         </c>
         <c ca="left">
            <p>DDB_G0277501</p>
         </c>
         <c ca="left">
            <p>capA/B</p>
         </c>
         <c ca="left">
            <p>57536</p>
         </c>
         <c ca="left">
            <p>DPU_G0062378</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>Thy1</p>
         </c>
         <c ca="left">
            <p>Thymidylate synthesis</p>
         </c>
         <c ca="left">
            <p>DDB_G0280045</p>
         </c>
         <c ca="left">
            <p>thyA, thymidylate synthesis</p>
         </c>
         <c ca="left">
            <p>149635</p>
         </c>
         <c ca="left">
            <p>DPU_G0069806</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>DUF885</p>
         </c>
         <c ca="left">
            <p>Unknown</p>
         </c>
         <c ca="left">
            <p>DDB_G0278355</p>
         </c>
         <c ca="left">
            <p>Unknown</p>
         </c>
         <c ca="left">
            <p>155362</p>
         </c>
         <c ca="left">
            <p>DPU_G0059974</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>DUF1121</p>
         </c>
         <c ca="left">
            <p>Unknown</p>
         </c>
         <c ca="left">
            <p>DDB_G0277411</p>
         </c>
         <c ca="left">
            <p>Unknown</p>
         </c>
         <c ca="left">
            <p>39626</p>
         </c>
         <c ca="left">
            <p>DPU_G0062812</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>DUF1289</p>
         </c>
         <c ca="left">
            <p>Unknown</p>
         </c>
         <c ca="left">
            <p>DDB_G0282477</p>
         </c>
         <c ca="left">
            <p>Unknown</p>
         </c>
         <c ca="left">
            <p>27078</p>
         </c>
         <c ca="left">
            <p>DPU_G0056950</p>
         </c>
      </r>
      <r>
         <c ca="left">
            <p>DUF1294</p>
         </c>
         <c ca="left">
            <p>Unknown</p>
         </c>
         <c ca="left">
            <p>DDB_G0285825</p>
         </c>
         <c ca="left">
            <p>Unknown</p>
         </c>
         <c ca="left">
            <p>86664</p>
         </c>
         <c ca="left">
            <p>DPU_G0067456</p>
         </c>
      </r>
   </tblbdy><tblfn>
      <p><sup>a</sup>The Pfam domain designation <abbrgrp><abbr bid="B99">99</abbr></abbrgrp>. <sup>b</sup>Confirmed or proposed function of the prokaryotic ortholog is given. <sup>c</sup>The <it>D. discoideum </it>gene ID number and functional annotation are from dictyBase <abbrgrp><abbr bid="B14">14</abbr></abbrgrp>. <sup>d</sup><it>D. purpureum </it>ortholog protein ID numbers <abbrgrp><abbr bid="B13">13</abbr></abbrgrp>. All orthologs are 90 to 100% similar in amino acid sequence to the <it>D. discoideum </it>protein over >90% of their length. <sup>e</sup>A related sequence is present, but no protein model could be produced from the current assembly.</p>
   </tblfn></tbl>
<p>Functional information now exists for 6 of the 16 proposed HGT genes and it is interesting to see how the dictyostelids have utilized these contributions from bacteria. ThyA has completely replaced an essential enzyme in central metabolism <abbrgrp>
<abbr bid="B21">21</abbr>
</abbrgrp>. Since it is also present in the amoebozoan slime mold <it>Physarum polycephalum </it>(GenBank accession number [GenBank:<ext-link ext-link-id="AAY87038" ext-link-type="gen">AAY87038</ext-link>] <abbrgrp>
<abbr bid="B22">22</abbr>
</abbrgrp>), the change over to the rare bacterial enzyme must have taken place quite early in the radiation of the amoebozoa. The isopentenyl transferase, IptA, produces discadenine, which is a sporulation inducer and spore germination inhibitor <abbrgrp>
<abbr bid="B23">23</abbr>
</abbrgrp>. Another gene, <it>pscA</it>, encodes an active penicillin-sensitive peptidase but its function is not known <abbrgrp>
<abbr bid="B24">24</abbr>
</abbrgrp>, and Ppk1 is a bacterial type polyphosphate synthase <abbrgrp>
<abbr bid="B25">25</abbr>
</abbrgrp>. Colossin A (ColA) appears to be a structural protein of the slug that was fashioned out of hundreds of repeats of a bacterial Cna_B domain <abbrgrp>
<abbr bid="B1">1</abbr>
</abbrgrp>. CapA and CapB are two cAMP-binding proteins whose carboxy-terminal half is derived from a subunit of a bacterial tellurium resistance complex <abbrgrp>
<abbr bid="B26">26</abbr>
</abbrgrp>. Recently, CapB was identified in a proteomic screen for centrosomal proteins <abbrgrp>
<abbr bid="B27">27</abbr>
</abbrgrp>.</p>
</sec>
<sec>
<st>
<p>Conserved gene order between the <it>D. purpureum </it>and <it>D. discoideum </it>genomes</p>
</st>
<p>Genomes evolve through base substitution and insertion/deletion, and also through rearrangements that alter the order and orientation of genes on chromosomes. Synteny, the nature and extent of conserved gene order between species, serves as an important gauge of the dynamics of genome evolution <abbrgrp>
<abbr bid="B28">28</abbr>
</abbrgrp>. To characterize the potential synteny between <it>D. purpureum </it>and <it>D. discoideum</it>, we identified blocks of approximately conserved gene order between their genomes, and compared the number and sizes of these potential conserved syntenic blocks to control genomes in which the gene orders were artificially scrambled. Although the <it>D. purpureum </it>genome is not fully assembled, the current level of contiguity allows for an analysis of conserved gene order on a small scale (approximately 50 kb). Blocks of potential synteny were constructed by single-linkage clustering of <it>D. purpureum </it>genes, where pairs of genes are considered linked if (i) they fall on the same scaffold of the assembly with at most <it>w </it>intervening genes that have <it>D. discoideum </it>orthologs, and (ii) their <it>D. discoideum </it>orthologs all fall on a single chromosome, with no more than <it>w </it>intervening genes that have <it>D. purpureum </it>orthologs. For stretches of perfectly conserved gene order (blocks constructed with <it>w </it>= 0), 4,734 (63%) of the 1:1 ortholog pairs used in the analysis lie in a genomic block of conserved gene order involving at least two genes in each genome. The mean size of such blocks is 2.8 genes in each genome, with the longest perfectly conserved stretch containing 10 genes.</p>
<p>To determine the maximum length scale over which significant conservation of gene order persists, we compared the increase in potential syntenic clusters as a function of an increasing number of intervening genes (<it>w</it>) for <it>D. purpureum </it>versus <it>D. discoideum </it>to the rate obtained for the permutation controls (Figure S6 in Additional file <supplr sid="S1">1</supplr>). We found that for up to about 15 intervening genes, potential conserved gene clusters grow significantly faster than what is expected for the same two genomes with randomized gene orders, which provides a conservative threshold for identifying blocks of conserved gene order. With this estimate, 76% of orthologous gene pairs participate in a block of approximately conserved gene order, compared to 5.8 &#177; 0.4% in controls, with a false positive rate, on a gene-by-gene basis, of approximately 7%. The 5,793 genes contained in these blocks, and their positions in the genome, are listed in Additional file <supplr sid="S2">2</supplr>. This indicates that the majority of orthologs in <it>D. purpureum </it>and <it>D. discoideum </it>are found in small neighborhoods of exactly conserved gene order between the two species, and that these neighborhoods are themselves clustered into larger regions of approximately conserved gene order.</p>
<suppl id="S2">
<title>
<p>Additional file 2</p>
</title>
<text>
<p>
<b>Supplementary Table S2</b>. A table listing blocks of partially conserved gene order between the <it>D. discoideum </it>and <it>D. purpureum </it>genomes.</p>
</text>
<file name="gb-2011-12-2-r20-S2.DOC">
   <p>Click here for file</p>
</file>
</suppl>
</sec>
</sec>
<sec>
<st>
<p>Gene content comparisons of <it>D. purpureum </it>and <it>D. discoideum </it>genomes</p>
</st>
<sec>
<st>
<p>Non-coding RNA genes</p>
</st>
<p>The described catalog of non-coding RNAs (ncRNAs) in the Dictyostelia was long limited to tRNAs, rRNAs, and a handful of experimentally identified short RNAs, all found in <it>D. discoideum </it>(for review, see <abbrgrp>
<abbr bid="B29">29</abbr>
</abbrgrp>). Recent work has expanded this repertoire to include a family of spliceosomal ncRNAs and two classes (class I and class II) of novel ncRNAs <abbrgrp>
<abbr bid="B30">30</abbr>
<abbr bid="B31">31</abbr>
</abbrgrp>. The spliceosomal RNAs identified in <it>D. discoideum</it>, U1, U2, U4, U5, and U6, are each characterized by both specific RNA-binding motifs and the ability to fold into characterized secondary structures <abbrgrp>
<abbr bid="B30">30</abbr>
<abbr bid="B31">31</abbr>
</abbrgrp>. Using a modified BLAST search (Additional file <supplr sid="S1">1</supplr>), we have identified a set of <it>D. purpureum </it>spliceosomal homologs that are predicted to fold into the appropriate secondary structures (Table S3a in Additional file <supplr sid="S1">1</supplr>).</p>
<p>In <it>D. discoideum </it>a '<it>Dictyostelium </it>upstream sequence element' (DUSE) has been described that sits approximately 63 bp upstream of many ncRNAs, including the class I and II ncRNAs <abbrgrp>
<abbr bid="B31">31</abbr>
</abbrgrp>. Identification of the DUSE motif ([AT]CCCA[AT]AA) in <it>D. purpureum </it>revealed that a DUSE also sits upstream of all <it>D. purpureum </it>spliceosomal RNA genes. The DUSE also enriches for a family of putative <it>D. purpureum </it>ncRNAs that are homologous to the two novel classes of <it>D. discoideum </it>ncRNAs. This suggests that the DUSE is not specific to <it>D. discoideum</it>.</p>
<p>Operating under the assumption that the DUSE sits upstream of certain ncRNAs in <it>D. purpureum</it>, we sought to identify novel ncRNAs by focusing on DUSE-enriched 8-bp sequences (see Additional file <supplr sid="S1">1</supplr> for methods). Two of the three 8-mers that were found to be highly enriched, CCTTACAG and CTTACAGC, also occur in the novel classes of <it>D. discoideum </it>ncRNAs. These ncRNA gene products are 50 to 60 bp long and have distinct 5' and 3' sequences predicted to form 5-bp stem structures that are conserved within each class (Figure <figr fid="F4">4</figr>). Both classes share a 12-bp 'bulge' sequence, CCTTACAGCCAA, which is immediately 3' to the 5' stem sequence <abbrgrp>
<abbr bid="B30">30</abbr>
</abbrgrp>. This 'bulge' sequence is predicted to not bind with any other region of the ncRNA, thus constituting a non-self-binding region (NSBR). The two 8-mers both sit within this NSBR.</p>
<fig id="F4"><title><p>Figure 4</p></title><caption><p>Putative novel ncRNAs in <it>D. purpureum</it></p></caption><text>
   <p><b>Putative novel ncRNAs in <it>D. purpureum</it></b>. The sequences and predicted structures of select class I and II ncRNAs in both <it>D. discoideum </it>and <it>D. purpureum</it>. The red dots indicate base pair positions that possess high mutual information but lack sequence identity. This region contains the 5' and 3' stem sequences, which are conserved among each species but not between both. Blue dots indicate base positions where sequences are perfectly conserved, corresponding to the non-self-binding region (NSBR). The starred positions are connected via a variable sequence (green box in alignment), which lacks primary sequence or secondary structure conservation (see Figure S8 in Additional file <supplr sid="S1">1</supplr> for complete alignment).</p>
</text><graphic file="gb-2011-12-2-r20-4"/></fig>
<p>To identify putative homologs to the class I and II ncRNAs in <it>D. purpureum</it>, we used the structural characteristics of these ncRNAs to filter all sequences containing the DUSE-enriched 8-mers. Forty members of the class I and II ncRNAs were originally identified in <it>D. discoideum</it>. Some are described as putative, with nine lacking the canonical bulge sequence, and five others lacking an upstream DUSE, or having a degenerate DUSE. The class I ncRNAs have a 5' stem sequence of GTTGA, while two class II ncRNAs have a 5' stem sequence of GCTCG, and all members have a 3' stem sequence complementary to the 5' stem sitting 40 to 70 bp away from the 5' stem <abbrgrp>
<abbr bid="B29">29</abbr>
</abbrgrp>.</p>
<p>In our analysis of the masked <it>D. discoideum </it>genome, we identified 46 occurrences of the CTTACAGC 8-mer (Additional file <supplr sid="S1">1</supplr>). Of these, 26 possess both an upstream DUSE and a 5'/3' stem pair sitting 40 to 70 bp apart, and each corresponds to a previously identified class I or II ncRNA. In the masked <it>D. purpureum </it>genome there are 61 occurrences of the CCTTACAG 8-mer; 26 of these 8-mers have both an upstream DUSE and a 5'/3' stem pair consisting of an identical 5' sequence (GAATT) (Figure <figr fid="F4">4</figr>). These results suggest a class of ncRNAs in <it>D. purpureum </it>similar to the class I and II ncRNAs found in <it>D. discoideum</it>.</p>
<p>The comparative genomics approach to identifying these ncRNAs in <it>D. purpureum </it>lends deeper insight into their function. The 5' and 3' stem sequences have diverged between species, but have done so in a compensatory manner that maintains the predicted 5'/3' structure. The NSBR sequence, however, has remained perfectly conserved between species, and in neither species is it predicted to self-bind. This suggests a functional role for the NSBR beyond self-interaction, possibly as a binding site for another functional element. Initial genomic analysis of the dictyostelids <it>Dictyostelium citrinum </it>and <it>Polysphondylium </it>
<it>violaceum </it>also revealed putative ncRNAs with an upstream DUSE, the conserved NSBR sequence, a 5'/3' stem structure, but 5'/3' stem sequences different from those of <it>D. discoideum </it>and <it>D. purpureum </it>(unpublished data).</p>
</sec>
<sec>
<st>
<p>Determination of protein orthologs</p>
</st>
<p>Of the 12,410 predicted <it>D. purpureum </it>proteins, we identified 7,619 that are likely to be orthologous to <it>D. discoideum </it>proteins using the Inparanoid algorithm, best reciprocal blast hits, and manual curation (Additional file <supplr sid="S3">3</supplr>). An additional 2,759 predicted proteins are similar to genes in <it>D. discoideum</it>, while 2,001 appear to be unique to <it>D. purpureum </it>(Additional file <supplr sid="S4">4</supplr>). Thus, at least 84% of the protein-coding genes in <it>D. purpureum </it>share orthologs or paralogs in the <it>D. discoideum </it>genome. The gene product predictions from the <it>D. purpureum </it>genome should be enormously useful for further refinement of the predicted proteome of <it>D. discoideum</it>. Some gene families are completely conserved between <it>D. purpureum </it>and <it>D. discoideum</it>, with clear orthologs for every member of the family, while other families appear to have undergone considerable divergence between the two species (Figure S9 in Additional file <supplr sid="S1">1</supplr>, and Additional file <supplr sid="S4">4</supplr>). The differences amongst gene family members should illuminate the physiological differences between these two dictyostelids, whereas the similarities may indicate where the selective pressures, exerted by their common environment, have resulted in stable gene inventories required for survival.</p>
<suppl id="S3">
<title>
<p>Additional file 3</p>
</title>
<text>
<p>
<b>Supplementary Table S4</b>. A table listing the predicted orthologs that are shared between <it>D. discoideum </it>and <it>D. purpureum</it>.</p>
</text>
<file name="gb-2011-12-2-r20-S3.DOC">
   <p>Click here for file</p>
</file>
</suppl>
<suppl id="S4">
<title>
<p>Additional file 4</p>
</title>
<text>
<p>
<b>Supplementary Tables S5</b>. A table listing the predicted paralogs that are shared between <it>D. discoideum </it>and <it>D. purpureum</it>.</p>
</text>
<file name="gb-2011-12-2-r20-S4.DOC">
   <p>Click here for file</p>
</file>
</suppl>
</sec>
<sec>
<st>
<p>Polyketide synthases</p>
</st>
<p>Polyketide synthases (PKSs) are enzymatic production lines for making small molecules by the repeated condensation of malonyl-CoA and other thio-esters of coenzyme A (CoA). A large number of polyketides exist and are probably made for ecological purposes, but they also serve as model natural products for the development of drugs, antibiotics and food additives. Soil amoebae are not commonly regarded as polyketide producers, but they too must face complex ecological challenges, which could be met by polyketide production; competition from other amoebae, infection by bacteria and predation by nematodes, amoebae and fungi. A small number of potential eco-chemicals have been identified from social amoebae <abbrgrp>
<abbr bid="B32">32</abbr>
<abbr bid="B33">33</abbr>
</abbrgrp>, but the completed <it>D. discoideum </it>genome sequence revealed a much larger potential <abbrgrp>
<abbr bid="B1">1</abbr>
<abbr bid="B34">34</abbr>
<abbr bid="B35">35</abbr>
</abbrgrp>. These PKSs are large, modular proteins of 2,000 to 3,500 amino acids, each having a core of domains for the condensation reaction, together with optional domains for methylation, carbonyl reduction and product release. Two have a unique, 'steely', architecture in which a second PKS - a chalcone synthase - is fused to the carboxyl terminus of a modular PKS <abbrgrp>
<abbr bid="B36">36</abbr>
</abbrgrp>. One of these steely proteins makes the precursor of differentiation-inducing factor (DIF)-1, a chlorinated signal molecule for stalk cell differentiation <abbrgrp>
<abbr bid="B37">37</abbr>
</abbrgrp>, and the other a pyrone or an olivetol derivative <abbrgrp>
<abbr bid="B35">35</abbr>
<abbr bid="B36">36</abbr>
<abbr bid="B38">38</abbr>
</abbrgrp>.</p>
<p>The <it>D. purpureum </it>genome has 50 predicted PKS genes. We constructed phylogenetic trees using the highly conserved ketoacyl synthase and acyl transfer domains of the PKS genes from both species to discern evolutionary relationships (Figure <figr fid="F5">5a</figr>; see Table S6 in Additional file <supplr sid="S1">1</supplr> for corresponding genomic loci). The two steely genes within each species are only distantly related to each other but are clearly orthologous between species. This implies that both genes were present in the last common ancestor and that their function has been maintained in both species. There is also a clear ortholog in <it>D. purpureum </it>of the methyltransferase catalyzing the last step of DIF-1 biosynthesis <abbrgrp>
<abbr bid="B39">39</abbr>
</abbrgrp> and so <it>D. purpureum </it>is likely to make DIF-1, like <it>D. discoideum</it>, and <it>Dictyostelium mucoroides </it>
<abbrgrp>
<abbr bid="B40">40</abbr>
</abbrgrp>, another group 4 dictyostelid <abbrgrp>
<abbr bid="B7">7</abbr>
</abbrgrp>. Two other clear orthologous pairs of genes are apparent. <it>Dp2 </it>and the very similar <it>Dd1</it>/<it>Dd2 </it>likely encode fatty acid synthases based on their similarity to other fatty acid synthases and their high expression levels. <it>Dp12 </it>and <it>Dd3 </it>are of unknown function, though mutation of <it>Dd3 </it>causes a 'cheater' phenotype, suggesting that it may produce a developmental signal <abbrgrp>
<abbr bid="B41">41</abbr>
</abbrgrp>.</p>
<fig id="F5"><title><p>Figure 5</p></title><caption><p>Polyketide synthases and histidine kinases of <it>D. purpureum</it></p></caption><text>
   <p><b>Polyketide synthases and histidine kinases of <it>D. purpureum</it></b>. <b>(a) </b>The phylogram of putative polyketide synthases was constructed from the ketoacyl synthase and acyltransferase domains of each predicted protein. Red numbers indicate <it>D. discoideum </it>genes and blue numbers indicate <it>D. purpureum </it>genes, with the corresponding genomic loci given in Table S6 in Additional file <supplr sid="S1">1</supplr>. Orthologous genes are circled in grey; the steely (<it>stlA</it>, <it>stlB</it>) and the putative fatty acid synthase (<it>fas</it>) genes are indicated. <b>(b) </b>Unrooted phylogram of the putative histidine kinases and the AcrA protein of <it>D. discoideum </it>and <it>D. purpureum </it>(denoted with 'Dp' before the gene names). Bootstrap values at each node are given for 1,000 iterations of tree building. The red numbers indicate the percent amino acid sequence identity between each pair of predicted proteins. Note the striking one-to-one correspondence between each gene in the two species.</p>
</text><graphic file="gb-2011-12-2-r20-5"/></fig>
<p>In contrast to the four <it>D. purpureum </it>genes described above, most <it>D. purpureum </it>PKS genes do not have obvious orthologs in <it>D. discoideum</it>, indicating species-specific expansions. Given the overall gene conservation between these two species, the divergence of the PKS gene sets is striking. We speculate that this greater evolutionary fluidity reflects different selective pressures placed on the two species, perhaps by different competitor species in their ecological niches, and therefore that most of their polyketides are produced for ecological purposes.</p>
<p>The <it>D. purpureum </it>genome confirms the high potential of social amoebae for polyketide production. The relative paucity of orthologs to <it>D. discoideum </it>PKSs raises the possibility that polyketide production varies substantially from species to species amongst the dictyostelids. As natural products remain the major source of drugs <abbrgrp>
<abbr bid="B42">42</abbr>
</abbrgrp>, this diversity suggests that natural products of social amoebae deserve systematic exploration.</p>
</sec>
<sec>
<st>
<p>The ATP-binding cassette transporters</p>
</st>
<p>The ABC transporters are one of the largest protein superfamilies that are encoded by any genome. In stark contrast to the lineage-specific radiation of the PKS proteins, the complement of ABC transporters has remained remarkably stable since the divergence of <it>D. purpureum </it>and <it>D. discoideum</it>. ABC proteins all have a conserved domain of 200 to 250 amino acids, the ATP-binding cassette, and typically have 12 transmembrane domains. Seven different eukaryotic families have been defined on the basis of sequence homology, domain topology and function. The superfamily has been extensively analyzed in <it>D. discoideum </it>
<abbrgrp>
<abbr bid="B43">43</abbr>
</abbrgrp> and this allowed a detailed comparison to the predicted <it>D. purpureum </it>ABC superfamily members. Both genomes carry similar numbers of ABC genes overall, but differences in gene number can be observed within groups of closely related genes belonging to the largest families (Tables S7 and S8 in Additional file <supplr sid="S1">1</supplr>). Only 58 genes can be considered clear orthologs; the remaining genes should be considered paralogs (Figure S10 in Additional file <supplr sid="S1">1</supplr>). These genes may play partially redundant roles and this might allow their sequences to drift to a point of uncertain orthology.</p>
<p>The Tag subfamily proteins (TagA-D) of the ABC B family have a novel domain structure with a serine protease domain on the amino terminus, a single set of six transmembrane domains, and one ABC domain on the carboxyl terminus. Three of the Tag proteins have defined roles in cell differentiation; TagA is involved in early cell fate determination <abbrgrp>
<abbr bid="B44">44</abbr>
</abbrgrp>, TagB is required for pre-stalk cell differentiation <abbrgrp>
<abbr bid="B45">45</abbr>
</abbrgrp>, and TagC is expressed in pre-stalk cells and required to process acyl-CoA binding protein into a spore differentiation peptide signal <abbrgrp>
<abbr bid="B46">46</abbr>
</abbrgrp>. Interestingly, TagA, B and C are conserved between <it>D. purpureum </it>and <it>D. discoideum</it>, but whereas the TagA orthologs are quite similar, the relationship between the TagB and TagC proteins in the two species is not as clear (they were named based on their gene order within a block of synteny between <it>D. discoideum </it>and <it>D. purpureum</it>).</p>
</sec>
<sec>
<st>
<p>Protein kinases</p>
</st>
<p>
<it>D. purpureum </it>has a similar complement of protein kinases compared to <it>D. discoideum</it>. Like <it>D. discoideum</it>, <it>D. purpureum </it>does not appear to have receptor tyrosine kinases, or other notable protein kinases such as P70, ATM, and PASK. There are 262 eukaryotic protein kinases and 41 atypical protein kinases, including potential pseudogenes (Table S9 in Additional file <supplr sid="S1">1</supplr>). This compares to 247 identified eukaryotic protein kinases and 39 atypical protein kinases in <it>D. discoideum </it>
<abbrgrp>
<abbr bid="B47">47</abbr>
</abbrgrp>.</p>
<p>The 14 <it>D. purpureum </it>histidine kinase genes, and the related <it>acrA </it>gene, each have an unambiguous ortholog in <it>D discoideum </it>(Figure <figr fid="F5">5b</figr>). There is little homology between non-orthologous genes outside of the kinase domain. Thus, the histidine kinases appear to have diverged from a common ancestor before the radiation of the dictyostelids, suggesting that each one of them carries out a distinct and conserved function. The adenylyl cyclase of <it>D. discodeum</it>, AcrA, carries a non-functional histidine kinase domain with mutations in key amino acids that preclude kinase activity <abbrgrp>
<abbr bid="B48">48</abbr>
</abbrgrp>. This domain and its variations are well conserved in the <it>D. purpureum </it>AcrA, suggesting that there is a selective advantage to maintaining this non-catalytic domain, probably as a dimerization domain.</p>
<p>The catalytic subunit of cAMP dependent protein kinase (PKA), PkaC, in <it>D. purpureum </it>shows 65% amino acid identity with its <it>D. discoideum </it>ortholog. The homology is highest in the catalytic core and lowest in the low complexity amino-terminal domain, with the exception of the region encompassing the &#945;A amphipathic helix <abbrgrp>
<abbr bid="B49">49</abbr>
</abbrgrp>. This helix, which is predicted to interact with a hydrophobic pocket on the catalytic core of the enzyme, is 95% identical in these dictyostelids, which is suggestive of a conserved regulatory function. The regulatory subunit of PKA, PkaR, of <it>D. purpureum </it>and <it>D. discoideum </it>shows 79% amino acid identity and each of them lack the dimerization domain found in metazoa.</p>
</sec>
<sec>
<st>
<p>G-protein coupled receptors</p>
</st>
<p>GPCRs are found in all eukaryotes and transduce a variety of extracellular signals via heterotrimeric G-proteins and effector proteins inside the cell to elicit physiological responses. GPCRs are characterized by an extracellular domain, an intracellular domain, and a core domain that contains seven transmembrane regions. The GPCRs are subdivided into six major families that, aside from their conserved secondary domain structure, do not share significant sequence similarity. The <it>D. purpureum </it>genome encodes the same families of GPCRs as in <it>D. discoideum</it>, but has a reduced total number, which is mainly due to differences in the numbers of cAMP, family 3 and family 5 receptors (Figure S12 and Table S10 in Additional file <supplr sid="S1">1</supplr>). There are only two cAMP receptors in the <it>D. purpureum </it>genome, namely orthologs of <it>Dictyostelium </it>
<it>carA </it>and <it>carB</it>, but there are no orthologs of <it>carC </it>and <it>carD</it>. In addition, there are 35% fewer family 3 receptors and 40% fewer family 5 receptors. This difference must be due either to an expansion of family 3, 5 and cAR receptors in <it>D. discoideum </it>or to a reduction in the <it>D. purpureum </it>genome. Either <it>D. discoideum </it>has evolved many new functions for GPCRs compared to <it>D. purpureum </it>or else there is more functional overlap amongst the <it>D. discoideum </it>receptors.</p>
</sec>
<sec>
<st>
<p>Transcription factors</p>
</st>
<p>The overall comparison of transcription factors in <it>D. discoideum </it>and <it>D. purpureum </it>shows gross conservation both in the total number of genes in each family, and at the protein sequence level (Table S11 in Additional file <supplr sid="S1">1</supplr>). There are only 11 basic leucine zipper (bZIP) domains in <it>D. purpureum</it>, versus 19 in <it>D. discoideum</it>. Among the 11 bZIPs found in both species are DimA and DimB, which are involved in DIF signaling in <it>D. discoideum</it>, as well as bZIP candidates for CREB and GCN4, which are the most conserved bZIPs among eukaryotes (E. Huang, M. Katoh-Kurasawa and G. Shaulsky; unpublished). There are an equal number of STAT transcription factors in <it>D. purpureum </it>and <it>D. discoideum </it>(four), each with a high degree of protein sequence identity. In the original description of the <it>D. discoideum </it>genome, the paucity of transcription factors was noted <abbrgrp>
<abbr bid="B1">1</abbr>
</abbrgrp>. One explanation for the small number of recognized transcription factors was the possibility of new classes of transcription factors that evade conventional detection based on sequence searches. One example is the recently defined CudA nuclear protein that binds <it>in vivo </it>to the promoter of the <it>cotC </it>prespore gene <abbrgrp>
<abbr bid="B50">50</abbr>
</abbrgrp>. CudA-related proteins have recently been defined as being specific to the amoebozoa <abbrgrp>
<abbr bid="B51">51</abbr>
</abbrgrp>, but there are distantly related proteins in plants <abbrgrp>
<abbr bid="B50">50</abbr>
</abbrgrp>.</p>
</sec>
<sec>
<st>
<p>The actin cytoskeleton and its regulation</p>
</st>
<p>The <it>D. purpureum </it>repertoire of microfilament system proteins is almost an exact replica of that described in <it>D. discoideum </it>(Table S12 in Additional file <supplr sid="S1">1</supplr>) <abbrgrp>
<abbr bid="B52">52</abbr>
</abbrgrp>. In contrast, the actin-depolymerizing factor (ADF) protein family differs between the <it>Dictyostelium </it>species. A phylogenetic tree of all ADF domains encoded by the genomes of both species shows three major groups (Figure S13 in Additional file <supplr sid="S1">1</supplr>). The ADF domains present in cofilin, twinfilin and GMF (glia maturation factor) constitute one group. <it>D. purpureum </it>has two genes encoding cofilins, <it>cofA </it>and <it>cofG</it>. Only <it>cofA </it>has a direct ortholog amongst the eight <it>D. discoideum </it>genes. An additional group of ADF domains is present in <it>D. purpureum </it>that includes three proteins, one of which (DPU_G0064410) has no direct ortholog in <it>D. discoideum </it>and another (DPU_G0060306) that is related to two <it>D. discoideum </it>genes (DDB_G0270134 and DDB_G0270132).</p>
<p>A family of proteins where there has been some expansion in <it>D. purpureum </it>is that of the I/LWEQ domain-containing proteins. Besides two talins and a single Sla2/HIP1, <it>D. purpureum </it>harbors three more genes related to <it>hipA </it>encoding only a carboxy-terminal fragment that encompasses the I/LWEQ domain. It is not clear whether these are actually pseudogenes. Similarly, we have found a group of at least eight genes that encode short proteins related to the carboxy-terminal part of HIP1 immediately upstream of the I/LWEQ domain. The extensive family of calponin homology (CH) domain proteins in <it>D. purpureum </it>has two members absent in <it>D. discoideum</it>. One (DPU_G0069574) is related to conventional fimbrins but lacks EF hands and has a weakly conserved fourth CH domain. The other (DPU_G0074288) is a protein with a carboxy-terminal CH domain.</p>
</sec>
<sec>
<st>
<p>Rho signaling</p>
</st>
<p>Cytoskeletal remodeling during chemotaxis and phagocytosis is regulated by a considerable number of upstream signaling components. Especially important are those components involved in signaling to and from small GTPases of the Rho family, as recently described in <it>D. discoideum </it>
<abbrgrp>
<abbr bid="B53">53</abbr>
</abbrgrp>. In general terms the repertoire of genes encoding proteins that participate in Rho signaling is very similar in both dictyostelid species, with some exceptions (Tables S13 and S14 in Additional file <supplr sid="S1">1</supplr>). The Rho GTPase family itself has diversified considerably in <it>D. purpureum </it>and <it>D. discoideum </it>(Figure S14 in Additional file <supplr sid="S1">1</supplr>). This family currently comprises 20 <it>rac </it>genes and one pseudogene in <it>D. discoideum </it>and 18 genes in <it>D. purpureum</it>. Most <it>D. discoideum </it>
<it>rac </it>genes have a direct ortholog in <it>D. purpureum</it>, but the degree of conservation is variable. There is a second <it>rac1a</it>-related gene, indicating that the ancestral <it>rac1 </it>gene duplicated independently in each organism. There is no ortholog for <it>D. discoideum </it>
<it>rac1b</it>, <it>rac1c</it>, <it>racF1</it>, <it>racF2</it>, <it>racI </it>and <it>racM </it>to <it>racO</it>, and the pseudogene <it>racK </it>and, conversely, <it>D. purpureum </it>has five more <it>rac </it>genes without a <it>D. discoideum </it>counterpart (<it>racR </it>to <it>racW</it>), again indicating that the <it>rac </it>family has undergone independent divergence in both species.</p>
<p>Among the Rho regulators <it>D. purpureum </it>appears to have one RhoGAP gene less than <it>D. discoideum</it>. The missing RhoGAP gene is <it>gacII</it>; the corresponding protein consists of a RhoGAP domain followed by a SH3 domain. The protein is very similar to the amino-terminal half of RacGAP1 (<it>xacA </it>gene), suggesting that <it>gacII </it>resulted from a partial duplication of <it>xacA </it>in <it>D. discoideum</it>. Among the Rho effectors, the class PI4P 5 kinases have undergone a notable expansion in <it>D. purpureum </it>(Table S14 in Additional file <supplr sid="S1">1</supplr>). Additional descriptions of Ras superfamily members can be found in Additional file <supplr sid="S1">1</supplr>.</p>
</sec>
</sec>
<sec>
<st>
<p>The <it>D. purpureum </it>glycome</p>
</st>
<p>Glycosylation is an extensive post-translational modification of proteins, and also occurs on lipids, nucleic acids and, of course, polysaccharides, in all forms of life. Though basic glycosylation pathways tend to be conserved among eukaryotes, glycosylation details can vary between species and cell types, and even between individual proteins as 'microheterogeneities'. In <it>D. discoideum</it>, protein glycosylation has been implicated in protein sorting and stability, cell proliferation, adhesion and sorting, spore coat assembly, resistance to cisplatin, and oxygen signaling. The inventory of predicted glycogenes likely to be associated with both anabolic and catabolic aspects of glycan metabolism approaches 2.5% of the genome (Tables S16, S17, S18, and S19 in Additional file <supplr sid="S1">1</supplr>), typical for metazoans but lower than for higher plants. As discussed below, a comparison of <it>D. purpureum </it>with the previously annotated glycogenes of <it>D. discoideum </it>
<abbrgrp>
<abbr bid="B54">54</abbr>
</abbrgrp>, in the context of the global CAZy classification <abbrgrp>
<abbr bid="B55">55</abbr>
<abbr bid="B56">56</abbr>
</abbrgrp>, suggests examples of both considerable conservation and diversification of their glycomes.</p>
<sec>
<st>
<p>N-linked glycosylation</p>
</st>
<p>Protein N-glycosylation, the most prevalent and highly conserved type of protein glycosylation, is initiated in the rough endoplasmic reticulum of <it>D. discoideum </it>by the transfer of a 14-sugar chain from a lipid-linked precursor <abbrgrp>
<abbr bid="B57">57</abbr>
</abbrgrp> that is identical to the yeast and human precursor but distinct from that of many protists <abbrgrp>
<abbr bid="B58">58</abbr>
</abbrgrp>. Maturation of the sugar chain leads to a preponderance of high-mannose glycans with bisecting and novel intersecting &#946;-linked GlcNAc, and &#945;3-linked core fucose characteristic of plants and invertebrates, followed by increased &#945;-mannosidase processing during development <abbrgrp>
<abbr bid="B59">59</abbr>
<abbr bid="B60">60</abbr>
</abbrgrp>. <it>D. discoideum </it>N-glycans are often rendered anionic by phosphorylation and sulfation <abbrgrp>
<abbr bid="B57">57</abbr>
<abbr bid="B59">59</abbr>
</abbrgrp>, in contrast to the typical sialic acid or uronic acid modifications of animal glycans.</p>
<p>A genomic comparison suggests that the N-glycome of <it>D. purpureum </it>will be similar to that of <it>D. discoideum </it>but with some interesting differences (Table S16 in Additional file <supplr sid="S1">1</supplr>). For example, putative CAZy GT49 &#946;3-GlcNAc transferases, GT10 &#945;3/4-fucosyltransferases, and glycophosphotransferases, expected to mediate peripheral modifications of N-linked and perhaps other glycans, are represented by much smaller gene families in <it>D. purpureum</it>, and low amino acid sequence similarities make ortholog predictions for individual family members less certain. Thus, <it>D. purpureum </it>may exhibit reduced prevalence and diversity of its peripheral glycan modifications.</p>
<p>The most dramatic predicted difference between the two dictyostelid glycomes stems from the apparent absence in <it>D. purpureum </it>of the four-member CAZy GT17 class of GT-like proteins expected to mediate addition of peripheral bisecting and/or intersecting &#946;4-GlcNAc residues. We tested this by performing a matrix-assisted laser desorption/ionization-time of flight (MALDI-TOF) mass spectrometry glycomic analysis, which confirmed the presence in <it>D. discoideum </it>of N-glycans containing two peripheral GlcNAc residues and/or an &#945;3-linked core fucose, and revealed an apparent absence of these species in <it>D. purpureum </it>(Figure <figr fid="F6">6</figr>). The results suggest that CAZy family GT17 and GT10 sequences present in <it>D. discoideum </it>but absent from <it>D. purpureum </it>encode a novel N-glycan &#946;-GlcNAc transferase and a core &#945;3-fucosyltransferase, respectively, emphasizing the value of comparative genomics for predicting gene functions. Other studies have indicated that N-glycans are dominant contributors to the cell surface glycocalyx, and therefore may strongly influence intra- and inter-specific encounters with other amoebae, and interactions with potential predators, pathogens and prey. Thus, the dramatically different N-glycomes of these species might contribute to, for example, their differential sorting in interspecific mixtures <abbrgrp>
<abbr bid="B61">61</abbr>
</abbrgrp>.</p>
<fig id="F6"><title><p>Figure 6</p></title><caption><p>Comparison of the N-glycomes of <it>D. purpureum </it>and <it>D. discoideum </it>cells</p></caption><text>
   <p><b>Comparison of the N-glycomes of <it>D. purpureum </it>and <it>D. discoideum </it>cells</b>. Cells were harvested from co-cultures with <it>Klebsiella aerogenes</it>, and N-glycans were released from total CHAPS-solubilized, pepsin-digested protein using PNGase A <abbrgrp><abbr bid="B59">59</abbr><abbr bid="B60">60</abbr></abbrgrp>. <b>(a) </b>Matrix-assisted laser desorption/ionization-time of flight (MALDI-TOF)/TOF mass spectrometry spectrum of underivatized <it>D. discoideum </it>N-glycans. <b>(b) </b>Corresponding spectrum from <it>D. purpureum</it>. Structure assignments are based on glycan compositions derived from m/z values (H = Hex, N = HexNAc, F = Fuc), tandem mass spectrometry analysis, linkage analysis and exoglycosidase digestions. Brackets indicate uncertainties in the positions of peripheral GlcNAc (= N) and mannose (= H) residues. The major ions are [M + Na]<sup>+</sup>; minor [M + K]<sup>+ </sup>ions are also present. <it>D. purpureum </it>N-glycans lack &#945;3-linked core fucose and the fourth peripheral &#946;4-linked GlcNAc consistent with the absence of CAZy GT10 and GT17 genes predicted to encode the glycosyltransferases responsible for these peripheral modifications in <it>D. discoideum </it>(Table S16 in Additional file <supplr sid="S1">1</supplr>). A.u., arbitrary units.</p>
</text><graphic file="gb-2011-12-2-r20-6"/></fig>
</sec>
<sec>
<st>
<p>Other glycosylation events associated with the secretory pathway</p>
</st>
<p>A previous inspection of the predicted <it>D. discoideum </it>proteome also indicated the existence of some major classes of biosynthetic enzymes associated with mucin-type O-glycans, O-phosphoglycans, and glycosylphosphatidylinisotol (GPI) anchors <abbrgrp>
<abbr bid="B54">54</abbr>
</abbrgrp>, in agreement with biochemical studies <abbrgrp>
<abbr bid="B57">57</abbr>
</abbrgrp>. For example, mucin-type O-glycosylation is initiated in the Golgi by a CAZy GT60 polypeptide &#945;-GlcNAc transferase, conserved in both dictyostelids and related to the polypeptide &#945;-GalNAc transferases associated with mucin-type O-glycosylation in animals <abbrgrp>
<abbr bid="B62">62</abbr>
</abbrgrp>. Glycophosphorylation of the hydroxyamino acids threonine and serine may be less prevalent in <it>D. purpureum </it>owing to the much smaller size of its glycophosphotransferase-like gene family (Table S16). Although the glycogene comparison suggests a general conservation of these other aspects of the glycome, differences suggest that there may be equally dramatic variations as observed for N-glycosylation.</p>
</sec>
<sec>
<st>
<p>Cytoplasmic glycome</p>
</st>
<p>Whereas glycosylation occurs predominantly in the secretory compartments, formation of the precursors for these pathways generally originates in the cytoplasm, and the cytoplasm is also a site for catabolic deglycosylation. The genome encodes proteins associated with these functions as expected. In addition, like most eukaryotes, <it>D. discoideum </it>encodes a potential nucleo-cytoplasmic Spy-like GT41 O-GlcNAc transferase (OGT or Ser/Thr-&#946;GlcNAc transferase) and <it>D. purpureum </it>encodes two; the physiological function(s) of O-GlcNAc in protists is currently unknown <abbrgrp>
<abbr bid="B63">63</abbr>
</abbrgrp>. <it>D. discoideum </it>also possesses a complex cytoplasmic O-glycosylation pathway that modifies hydroxyproline and has an ancient evolutionary relationship with O-glycosylation in the secretory pathway and bacterial glycosylation <abbrgrp>
<abbr bid="B64">64</abbr>
</abbrgrp>. The genes of this pathway are highly conserved in <it>D. purpureum</it>, and bioinformatics and biochemical data indicate its partial conservation across at least four major protist phyla. This pathway is devoted to the modification of the E3 ubiquitin ligase subunit Skp1, and is involved in oxygen regulation of development in <it>D. discoideum </it>
<abbrgrp>
<abbr bid="B65">65</abbr>
</abbrgrp>.</p>
</sec>
<sec>
<st>
<p>Carbohydrate binding proteins</p>
</st>
<p>Many glycan functions are mediated <it>in trans </it>via carbohydrate binding domains (CBDs) or lectins. During initial remodeling within the rough endoplasmic reticulum, N-glycans are recognized by lectins in a folding/quality control cycle and, unlike many protists, this pathway appears to be highly conserved between the dictyostelids and animals <abbrgrp>
<abbr bid="B66">66</abbr>
</abbrgrp>. <it>D. discoideum </it>encodes numerous cytoplasmically localized lectins, including multiple discoidin, Cup and comitin proteins <abbrgrp>
<abbr bid="B67">67</abbr>
<abbr bid="B68">68</abbr>
<abbr bid="B69">69</abbr>
</abbrgrp>, and glycogen-binding proteins involved in metabolic regulation (Tables S18 and S19 in Additional file <supplr sid="S1">1</supplr>). Except for the latter, the natural glycan ligands in the cytoplasm are unknown. Interestingly, discoidins, like galectins of animals, exit cells via a non-classical process and potentially bind self, prey or predator glycans containing Gal or GalNAc <abbrgrp>
<abbr bid="B70">70</abbr>
</abbrgrp>. Discoidin and Cup CBDs appear to be dictyostelid-specific and evolutionarily dynamic, suggesting they serve species-specific functions as suggested for other lineage-specific expansions <abbrgrp>
<abbr bid="B71">71</abbr>
</abbrgrp>.</p>
</sec>
<sec>
<st>
<p>Carbohydrate catabolism</p>
</st>
<p>Both genomes encode a few more glycohydrolases (Table S16 in Additional file <supplr sid="S1">1</supplr>) than glycosyltransferases, with suspected substrates ranging from dietary polysaccharides and glycans of bacterial, yeast and perhaps other prey to endogenous glycans for recycling. Potentially 11 of the glycohydrolase domains are fused to carbohydrate binding modules (CBMs), a subset of CBDs associated with enzymes. As described for some cellulases such as CelA, the CBM may localize the enzyme to the target substrate after secretion, and may also directly promote catalysis <abbrgrp>
<abbr bid="B72">72</abbr>
</abbrgrp>. Peptidases may be localized at the cell surface by a similar mechanism. Cellulases are likely to be involved in remodeling of slime sheath cellulose during morphogenesis and spore coat breakdown during germination. <it>D. purpureum </it>and <it>D. discoideum </it>also have a cellulase associated with extracellular digestion in fungi and other cellulose-digesting organisms (CAZy GH7), suggesting a similar role in the social amoebae. Though the number of glycosyltransferases and known glycan binding proteins is 10 to 20% smaller in <it>D. purpureum </it>than <it>D. discoideum</it>, correlating with fewer peripheral modifications, the number of potential glycohydrolases is approximately 10% greater. The latter differences occur in lysozyme-, chitinase-, and alpha-mannosidase-like enzymes, suggesting variation in the spectrum of bacterial and yeast prey between the species.</p>
</sec>
</sec>
<sec>
<st>
<p>Multicellular development and dictyostelid sociality</p>
</st>
<p>The dictyostelid social amoebae undergo multicellular development when nutrients become limiting for vegetative growth. The ensuing events of aggregation of individual cells into an initial mound, slug migration, and ultimately fruiting body morphogenesis, require several cooperative interactions between the cells. These cooperative cellular behaviors include: cellular chemotaxis to self-generated, field-wide spiral waves of extracellular cAMP; the coordinated movements of cells within specialized tissues of the mounds and slugs requiring differential cell adhesion; an innate immune system; and the apparent altruism displayed by the pre-stalk cells that die as they construct the stalk, presumably to aid the dispersal of the spores in the sorus. The initial analyses of the <it>D. discoideum </it>genome uncovered a number of protein classes that might mediate this extensive cellular cooperation, and that were previously thought to be unique to metazoa <abbrgrp>
<abbr bid="B1">1</abbr>
</abbrgrp>. These proteins included certain subfamilies of ABC transporters, metabotropic GPCRs, and cell surface proteins predicted to contain repeated epidermal growth factor (EGF) or Ig-like domains that had not previously been seen in plants, fungi or amoebae.</p>
<p>One large family of 37 metazoan-like proteins described in <it>D. discoideum</it>, the Tiger (transmembrane, IPT, Ig-like, E-SET repeat) proteins, contain family members that mediate cell-cell interactions during development. Mutations in <it>tgrB1</it>, <it>tgrC1 </it>(formerly <it>lagC</it>), <it>tgrD1 </it>and <it>tgrE1 </it>all result in the arrest of development at the mound stage, and TgrB1 and TgrC1 have been implicated in a self/non-self recognition system that may mediate kin recognition <abbrgrp>
<abbr bid="B73">73</abbr>
</abbrgrp>. Twenty-six Tiger-protein encoding genes are present in the <it>D. purpureum </it>genome, including orthologs to <it>D. discoideum</it>'s <it>tgrC1</it>, <it>tgrD1</it>, <it>tgrF1</it>, <it>tgrK1</it>, <it>tgrM2</it>, and <it>tgrN1 </it>genes. Their presence suggests that the Tiger protein family may be generally involved in allorecognition in the dictyostelids.</p>
<p>An innate immune system has been recently described that functions during slug migration of <it>D. discoideum </it>and appears to be present in other group 4 dictyostelids, including <it>D. purpureum </it>
<abbrgrp>
<abbr bid="B74">74</abbr>
</abbrgrp>. It consists of a population of sentinel cells that patrol the body of the slug, engulf any bacteria that are present, bind to the slime sheath, and then exit the slug by being left behind in the slime trail. Sentinel cells are 1% of all slug cells and express particular genes that are related to innate immunity signaling genes in plants and animals, such as <it>slrA </it>and <it>tirA</it>. In particular, <it>tirA</it>, a Toll/interleukin receptor I domain containing protein, is required for some aspects of sentinel cell function <abbrgrp>
<abbr bid="B74">74</abbr>
</abbrgrp>. <it>D. purpureum </it>has orthologs for both <it>slrA </it>and <it>tirA</it>, as well as three amoeba-specific lysozymes (Additional file <supplr sid="S4">4</supplr>).</p>
<sec>
<st>
<p>Cyclic nucleotide signalling genes</p>
</st>
<p>cAMP controls many aspects of dictyostelid development. As a dynamically secreted chemoattractant it directs the cell movement that causes cells to aggregate, and aggregates to transform into fruiting structures. Secreted cAMP also triggers pre-spore differentiation, up-regulates the expression of aggregation genes and down-regulates stalk gene expression. As an intracellular messenger for other stimuli, cAMP induces spore and stalk encapsulation and maintains spore dormancy <abbrgrp>
<abbr bid="B23">23</abbr>
<abbr bid="B46">46</abbr>
<abbr bid="B75">75</abbr>
<abbr bid="B76">76</abbr>
</abbrgrp>.</p>
<p>In <it>D. discoideum</it>, 19 proteins are directly responsible for synthesis, detection and degradation of cAMP and its sister molecule, cGMP, which acts as a signaling intermediate for chemotaxis <abbrgrp>
<abbr bid="B77">77</abbr>
</abbrgrp>. To assess whether cyclic nucleotides play similar roles in <it>D. purpureum </it>development, we analyzed conservation and change in all genes that are directly involved in cyclic nucleotide signaling. <it>D. discoideum </it>uses the adenylate cyclases ACA, ACB and ACG and the guanylate cyclases sGC and GCA for synthesis of cAMP and cGMP, respectively <abbrgrp>
<abbr bid="B76">76</abbr>
<abbr bid="B78">78</abbr>
</abbrgrp>. All five cyclases are present in <it>D. purpureum </it>inclusive of their functional domain architecture (Figure <figr fid="F7">7a</figr>). The structurally distinct cell surface cAMP receptors (cARs) and intracellular cyclic nucleotide (cNMP) binding domains are the sole targets for cyclic nucleotides in dictyostelids. <it>D. discoideum </it>has four cARs, which are conserved in two other group 4 taxa, <it>D. mucoroides </it>and <it>Dictyostelium rosarium </it>
<abbrgrp>
<abbr bid="B79">79</abbr>
</abbrgrp>. Nonetheless, only the <it>cAR1 </it>and <it>cAR2 </it>genes were detected in the <it>D. purpureum </it>genome (Figure <figr fid="F7">7b</figr>). No firm conclusions about the absence of <it>cAR3 </it>and <it>cAR4 </it>can yet be drawn, since the assembly of this genome is not fully complete.</p>
<fig id="F7"><title><p>Figure 7</p></title><caption><p>Architectural conservation of cyclic nucleotide signaling genes</p></caption><text>
   <p><b>Architectural conservation of cyclic nucleotide signaling genes</b>. Deduced sequences of <it>D. discoideum </it>(<it>Ddis</it>) and <it>D. purpureum </it>(<it>Dpur</it>) proteins were analyzed by SMART <abbrgrp><abbr bid="B105">105</abbr></abbrgrp> for the presence of functional domains, signal peptides and transmembrane helices. To build protein phylogenies, conserved shared functional domains were aligned using CLUSTAL-W <abbrgrp><abbr bid="B106">106</abbr></abbrgrp> and edited when necessary in BioEdit <abbrgrp><abbr bid="B107">107</abbr></abbrgrp> to juxtapose functionally essential amino acid residues. Regions that did not align unambiguously were deleted. For proteins with two similar domains (cyclases and cyclic nucleotide (cNMP) binding proteins), a tandem alignment of both domains was used, with the single domains of ACB and ACG used twice. Phylogenetic relationships between aligned sequences were determined by Bayesian inference <abbrgrp><abbr bid="B108">108</abbr></abbrgrp> using a mixed amino acid model. Rate variation between sites was estimated by a gamma distribution with a proportion of invariable sites. Analyses were run for 100,000 generations or until the standard deviation of split frequences was &lt;0.01. The phylogenetic trees are decorated with the domain architectures of the proteins, except for the <it>D. mucoroides </it>(<it>Dmuc</it>) and <it>D. rosarium </it>(<it>Dros</it>) cAMP receptor (cAR) sequences, which were derived from genes that were only partially amplified by PCR <abbrgrp><abbr bid="B79">79</abbr></abbrgrp>. All trees are unrooted, except for the cAR tree, which is rooted on the single cAR of the group 3 taxon <it>Dictyostelium minutum </it>(<it>Dmin</it>). The posterior probabilities (BIPP) of nodes are represented by line thickness. <b>(a) </b>Cyclases; <b>(b) </b>cAMP receptors; <b>(c) </b>cNMP binding domains; <b>(d) </b>cNMP phosphodiesterases. <it>Dpur </it>protein IDs and, if available, dictyBase IDs: SGC, 153022 (DPU_G0054494); ACB, 154751 (DPU_G0058520); GCA, 151484 (DPU_G0075774); ACA, 51614 (DPU_G0071214); ACG, 38950 (DPU_G0061484); GbpC, 168746; GbpD, 88426 (DPU_G0055716); PdeD, 98774 (DPU_G0059600); PdeE, 56777 (DPU_G0059268); PkaR, 157660 (DPU_G0065616); cAR1, 99295 (DPU_G0064058); cAR2, 92050 (DPU_G0053090); Pde3, 34050 (DPU_G0053756); Pde4, 150656 (DPU_G0073898); PdsA, 98685 (DPU_G0058978); PdsB, 168741 (DPU_G0056384); PdsC, 91767 (DPU_G0073930). GenBank accession numbers for <it>Ddis </it>sequences: ACB, [GenBank:<ext-link ext-link-type="gen" ext-link-id="AAD50121">AAD50121</ext-link>]; GCA, [GenBank:<ext-link ext-link-type="gen" ext-link-id="CAB42641">CAB42641</ext-link>]; ACA, [GenBank:<ext-link ext-link-type="gen" ext-link-id="AAA33163">AAA33163</ext-link>]; ACG, [GenBank:<ext-link ext-link-type="gen" ext-link-id="Q03101">Q03101</ext-link>]; GbpC, [GenBank:<ext-link ext-link-type="gen" ext-link-id="AAM34041">AAM34041</ext-link>]; GbpD, [GenBank:<ext-link ext-link-type="gen" ext-link-id="AAM34042">AAM34042</ext-link>]; PdeD, [GenBank:<ext-link ext-link-type="gen" ext-link-id="AAL06059">AAL06059</ext-link>]; PdeE, [GenBank:<ext-link ext-link-type="gen" ext-link-id="AAL06060">AAL06060</ext-link>]; PkaR, [GenBank:<ext-link ext-link-type="gen" ext-link-id="P05987">P05987</ext-link>]; cAR1, [GenBank:<ext-link ext-link-type="gen" ext-link-id="AAA33177">AAA33177</ext-link>]; cAR2, [GenBank:<ext-link ext-link-type="gen" ext-link-id="AAB25436">AAB25436</ext-link>]; cAR3, [GenBank:<ext-link ext-link-type="gen" ext-link-id="AAB25437">AAB25437</ext-link>]; cAR4, [GenBank:<ext-link ext-link-type="gen" ext-link-id="AAB32419">AAB32419</ext-link>]; Pde3, [GenBank:<ext-link ext-link-type="gen" ext-link-id="B0G0Y8">B0G0Y8</ext-link>]; Pde4, [GenBank:<ext-link ext-link-type="gen" ext-link-id="AAO59486">AAO59486</ext-link>]; PdsA, [GenBank:<ext-link ext-link-type="gen" ext-link-id="XP_637948">XP_637948</ext-link>]; Pde7, [GenBank:<ext-link ext-link-type="gen" ext-link-id="EAL62880">EAL62880</ext-link>]. GenBank accession numbers for <it>Dmuc </it>sequences: cAR1, [GenBank:<ext-link ext-link-type="gen" ext-link-id="ACF17575">ACF17575</ext-link>]; cAR2, [GenBank:<ext-link ext-link-type="gen" ext-link-id="ACF17576">ACF17576</ext-link>]; cAR3, [GenBank:<ext-link ext-link-type="gen" ext-link-id="ACF17577">ACF17577</ext-link>]; cAR4, [GenBank:<ext-link ext-link-type="gen" ext-link-id="ACF17578">ACF17578</ext-link>]. GenBank accession numbers for <it>Dros </it>sequences: cAR1, [GenBank:<ext-link ext-link-type="gen" ext-link-id="AAW24476">AAW24476</ext-link>]; cAR2, [GenBank:<ext-link ext-link-type="gen" ext-link-id="AAW24477">AAW24477</ext-link>]; cAR3, [GenBank:<ext-link ext-link-type="gen" ext-link-id="ACF17573">ACF17573</ext-link>]; cAR4, [GenBank:<ext-link ext-link-type="gen" ext-link-id="ACF17574">ACF17574</ext-link>]. GenBank accession number for <it>Dmin </it>cAR, [GenBank:<ext-link ext-link-type="gen" ext-link-id="AAS59250">AAS59250</ext-link>].</p>
</text><graphic file="gb-2011-12-2-r20-7"/></fig>
<p>The cNMP binding domains are found in the regulatory subunit of PKA (PkaR), the cGMP binding proteins GbpC and GbpD and the phosphodiesterases (PDEs) PdeD and PdeE. PdeD is a cGMP phosphodiesterase that is stimulated by cGMP binding to its cNMP binding domains, while PdeE is a cAMP-stimulated cAMP phosphodiesterase <abbrgrp>
<abbr bid="B76">76</abbr>
<abbr bid="B80">80</abbr>
</abbrgrp>. GbpC is a complex multidomain protein in which cGMP binding to its cNMP binding domains sequentially activates the intrinsic RasGEF, Ras/Roc and protein kinase domain, which eventually leads to increased cell polarization. GbpD also contains a RasGEF domain, but no output protein kinase domain. Its cNMP binding domains are not functional and it functions as an antagonist of GbpC in the chemotactic response <abbrgrp>
<abbr bid="B81">81</abbr>
<abbr bid="B82">82</abbr>
</abbrgrp>. Genes encoding all five cNMP binding proteins with their complete sets of functional domains are present in the <it>D. purpureum </it>genome (Figure <figr fid="F7">7c</figr>).</p>
<p>In <it>D. discoideum </it>cyclic nucleotides are hydrolyzed by three structurally distinct PDEs <abbrgrp>
<abbr bid="B80">80</abbr>
</abbrgrp>. The cAMP PDEs RegA and Pde4 and the cGMP PDE Pde3 harbor a PDE_I type domain with HDc motif that is common to mammalian PDEs. The dual-specificity PDEs PdsA and PDE7 harbor a PDE_II type domain with HSHLDH motif. PdeD and PdeE, which hydrolyze cGMP and cAMP, respectively, carry a related HCHADHDS motif, but are structurally more similar to the lactamase_B protein family. The PDE_I and PDE_III enzymes are fully conserved between <it>D. discoideum </it>and <it>D. purpureum</it>, but the latter species has three instead of two type II PDEs (Figure <figr fid="F7">7d</figr>).</p>
<p>The high level of conservation between <it>D. discoideum </it>and <it>D. purpureum </it>of all adenylate and guanylate cyclases, cNMP binding domains and seven out of eight PDEs, combined with the complete conservation of functional domain architecture of these proteins, is indicative of the central roles of cAMP and cGMP in the control of chemotaxis, morphogenesis and gene regulation in the dictyostelids.</p>
</sec>
<sec>
<st>
<p>DIF signaling</p>
</st>
<p>DIF is produced predominantly by pre-spore cells during <it>D. discoideum </it>development and is part of a signaling mechanism that sets the ratio of stalk and spore cells produced in the fruiting body. It both limits the number of pre-spore cells produced and induces differentiation of a subset of pre-stalk cells. DIF is made by a three step biosynthetic pathway, in which a 12-carbon polyketide is assembled by the StlB polyketide synthase, then successively chlorinated by a chlorinating enzyme, and methylated by the DmtA methyltransferase <abbrgrp>
<abbr bid="B36">36</abbr>
<abbr bid="B83">83</abbr>
<abbr bid="B84">84</abbr>
</abbrgrp>. Clear <it>stlB </it>and <it>dmtA </it>homologs exist in the <it>D. purpureum </it>genome, as does a homologue of a recently identified FAD-dependent chlorinating enzyme (C Neumann, C Walsh and RR Kay, unpublished). DIF is inactivated by glutathione-dependent dechlorination <abbrgrp>
<abbr bid="B85">85</abbr>
</abbrgrp>, and again this enzyme has recently been identified and has a clear homolog in <it>D. purpureum </it>(F Velazquez and RR Kay, unpublished). It thus appears certain that <it>D. purpureum </it>makes and degrades DIF in a similar way to <it>D. discoideum</it>, and presumably utilizes it in a similar way to regulate multicellular development.</p>
</sec>
<sec>
<st>
<p>Social genes</p>
</st>
<p>Dictyostelids are interesting social organisms because about 20% of the cells in each fruiting body sacrifice themselves to build the stalk. Groups form through aggregation of formerly separate cells, so different clones can aggregate together, and do so in both the lab and in the field <abbrgrp>
<abbr bid="B86">86</abbr>
</abbrgrp>. Clones that successfully compete to get into spores, relegating their partners to the sterile stalk, will be more successful. Some degree of conflict is therefore predicted, and the resulting evolution of strategies and counter strategies may drive rapid adaptive evolution, as appears to be true for genes involved in host-parasite conflicts and male-female conflicts <abbrgrp>
<abbr bid="B87">87</abbr>
</abbrgrp>. But there is also a second reason to expect that social genes may evolve more rapidly than genes expressed primarily in the solitary stage. If the social stage occurs relatively infrequently, which seems likely but is unknown, then social genes are less scrutinized by selection and could accumulate more changes through genetic drift.</p>
<p>We tested for more rapid evolution using two ways of defining social genes. The first was to examine the set of genes that emerged from a selection for mutants that cheat (make more than their fair share of spores in mixtures) and compare them with all other genes <abbrgrp>
<abbr bid="B41">41</abbr>
</abbrgrp>. The two sets do not differ significantly in the probability of having homologs, suggesting that they neither differentially disappear nor differentially evolve beyond the point of clear homology (Figure S18a in Additional file <supplr sid="S1">1</supplr>). The two sets also do not differ in probability of having paralogs, suggesting that they do not duplicate at different rates (Figure S18b in Additional file <supplr sid="S1">1</supplr>). Finally, the two sets do not differ for either dN (the rate of non-synonymous change) or conservation score (a measure that declines with both point differences and with non-aligned portions of the sequences) (Figures S18c and S19d in Additional file <supplr sid="S1">1</supplr>). However, this set of social genes is relatively small, and some will be false positives (of 198 genes identified, 40 were tested for cheating, of which 31 were cheaters).</p>
<p>A larger set of social genes can be identified using RNA-seq reads from the vegetative stage and six social time points (4, 8, 12, 16, 20, and 24 hours after starving) <abbrgrp>
<abbr bid="B15">15</abbr>
</abbrgrp>. Using genes with sufficient reads and high reproducibility (Additional file <supplr sid="S1">1</supplr>), we defined a gene's index of social expression as the average percentage representation in the social-stage libraries over that average plus the percentage representation in vegetative stage (that is, Social expression/Social expression + Vegetative expression).</p>
<p>Using this classification, social genes showed higher rates of change, and manifested fewer orthologs, higher rates of non-synonymous substitution, and lower conservation scores. Genes with orthologs in <it>D. discoideum </it>and <it>D. purpureum </it>have a significantly lower social expression index in <it>D. discoideum </it>than those without orthologs (Figure S19a in Additional file <supplr sid="S1">1</supplr>; <it>n </it>= 1,739, 1,300, <it>P </it>&lt; 2.2e-16, Mann-Whitney U test). This is driven by significant differences in each time point of the developmental stages (data not shown). An analysis using genes with <it>D. purpureum </it>RNA-seq data following the above criteria gives a similar overall result (Figure S19b in Additional file <supplr sid="S1">1</supplr>; <it>n </it>= 3,649, 2,102, <it>P </it>&lt; 2.2e-16, Mann-Whitney U test). Thus, genes with more social expression are less likely to have orthologs, indicating more rapid evolution in the gain or loss of genes, or in change of genes beyond the point where they are identifiable as homologs. Homologs that had inparalogs show no significant difference of social indices from those that lacked inparalogs when the social expression is measured with RNA-seq reads from <it>D. discoideum </it>(Figure S19c in Additional file <supplr sid="S1">1</supplr>; <it>n </it>= 95, 1,644, <it>P </it>= 0.93, Mann-Whitney U test) and <it>D. purpureum </it>(Figure S19d in Additional file <supplr sid="S1">1</supplr>; <it>n </it>= 137, 3,512, <it>P </it>= 0.24, Mann-Whitney U test), suggesting no significant bias of duplication for the social genes of dictyostelids.</p>
<p>Figure <figr fid="F8">8a</figr> plots conservation score and rates of non-synonymous substitution (dN) as a function of the <it>D. discoideum </it>social expression index. As the percentage of a gene's RNA-seq reads found in social stages increases, there is a significant drop in conservation score and a significant increase in dN, supporting the hypothesis that social genes change more rapidly than vegetative ones. The same significant results hold if we use the RNA-seq reads of <it>D. purpureum </it>genes (Figure <figr fid="F8">8b</figr>). Figure S20 in Additional file <supplr sid="S1">1</supplr> shows how the effect is partitioned between different social stages. Previous studies have suggested that individual social genes or small sets of them evolve rapidly because of evolutionary arms races, with conflict driving continuing adaptation and counter-adaptation <abbrgrp>
<abbr bid="B88">88</abbr>
</abbrgrp>. This is the first such evidence on a genomic scale. Nonetheless, we cannot rule out the alternative hypotheses that the lower selective scrutiny of social genes might arise if the social stage is not very frequent and not as selectively important as the vegetative stage. Distinguishing these hypotheses further will have to await the more sensitive tests that can be applied to genomes that are more closely related than <it>D. discoideum </it>and <it>D. purpureum</it>.</p>
<fig id="F8"><title><p>Figure 8</p></title><caption><p>Conservation score (CS, blue open circles) and non-synonymous substitution rate (dN, red crosses) as a function of the degree of a gene's expression in social versus vegetative stages (a,b) or of sexual versus vegetative stages (c)</p></caption><text>
   <p><b>Conservation score (CS, blue open circles) and non-synonymous substitution rate (dN, red crosses) as a function of the degree of a gene's expression in social versus vegetative stages (a,b) or of sexual versus vegetative stages (c)</b>. <b>(a) </b>For <it>D. discoideum </it>RNA-seq reads (1,739 genes) both regressions are significant (CS, y = -0.17x + 0.68, R<sup>2 </sup>= 0.063, <it>P </it>&lt; 0.0001; dN, y = 0.11x + 0.21, R<sup>2 </sup>= 0.032, <it>P </it>&lt; 0.0001). <b>(b) </b>For <it>D. purpureum </it>RNA-seq reads (3,649 genes), both regressions are also significant (CS, y = -0.20x + 0.69, R<sup>2 </sup>= 0.11, <it>P </it>&lt; 0.0001; dN, y = 0.14x + 0.21, R<sup>2 </sup>= 0.017, <it>P </it>&lt; 0.0001). <b>(c) </b>Conservation score and non-synonymous substitution rate as a function of the percentage of <it>D. discoideum </it>ESTs expressed in the gamete stage (932 genes, including 835 and 16 genes with a gamete expression index of 0% and 100%, respectively). Both regressions are significant: CS, y = -0.0070x + 0.73, R<sup>2 </sup>= 0.0072, <it>P </it>&lt; 0.01; dN, y = 0.00051x + 0.17, R<sup>2 </sup>= 0.00708, <it>P </it>= 0.01.</p>
</text><graphic file="gb-2011-12-2-r20-8"/></fig>
<p>
<it>Dictyostelium </it>has a sexual cycle in which two cells fuse and then engulf many other cells to form a giant macrocyst that undergoes meiosis. However, with the exception of one successful cross <abbrgrp>
<abbr bid="B89">89</abbr>
</abbrgrp>, the sexual system has not been available in lab studies of <it>D. discoideum</it>. Although macrocysts are readily formed, there are problems with germination <abbrgrp>
<abbr bid="B90">90</abbr>
</abbrgrp> and, when there is germination, there may be no recombinants <abbrgrp>
<abbr bid="B91">91</abbr>
</abbrgrp>. Finding the right conditions for sex would add a valuable genetic dimension to <it>D. discoideum </it>studies, but this search would be fruitless if most strains have lost the ability to have sex. If they have lost this ability, we would expect that sex-specific genes would have degraded. We tested this hypothesis using ESTs from gamete-stage libraries made from cells grown in conditions that make them competent for fusion <abbrgrp>
<abbr bid="B92">92</abbr>
</abbrgrp>. Figure <figr fid="F8">8c</figr> shows that genes expressed disproportionately in the gamete stage are actually more conserved than other genes, as measured by both dN and conservation score. Provided these truly are sex-specific genes, then it appears that the macrocyst system is functional and not degenerating in <it>D. discoideum</it>. This is supported by an analysis showing that 13 meiosis genes <abbrgrp>
<abbr bid="B93">93</abbr>
</abbrgrp> have normal dN and conservation score values compared to other genes (Figure S21 in Additional file <supplr sid="S1">1</supplr>).</p>
</sec>
</sec>
</sec>
<sec>
<st>
<p>Conclusions</p>
</st>
<p>Comparisons of the <it>D. purpureum </it>genome, the second group 4 dictyostelid to be sequenced, with the previously sequenced <it>D. discoideum </it>have provided insights into the evolution of this clade of social amoebae. Like <it>D. discoideum</it>, the genome of <it>D. purpureum </it>encodes a high number of triplet nucleotide repeats distributed in both exonic and non-protein-coding regions. However, these tracts are not generally congruent between the two genomes, indicating that their expansion is a consequence of an intrinsic physiology favoring high rates of triplet repeat formation, rather than retention and accumulation of ancient triplet repeats. Although the <it>D. purpureum </it>genome was not finished to the same extent as the <it>D. discoideum </it>genome, syntenic regions containing orthologous genes are detected. Genes that have been hypothesized as having been acquired through horizontal gene transfer in the <it>D. discoideum </it>genome have orthologs in the <it>D. purpureum </it>genome; thus, any HGT events involving these genes likely occurred in the common ancestor of the group 4 dictyostelids. Likewise, large gene families of ABC transporters and histidine kinases underwent expansion in the common ancestor before the species line split, while the expansion of polyketide synthase genes occurred in a lineage-specific manner. The repertoire of microfilament system proteins is virtually identical between the two species, but the regulatory proteins differ. Two distinct transferases involved in the N-linked glycosylation were detected in <it>D. discoideum </it>but not in <it>D. purpureum</it>, and the predicted change in the glycosylation state of the respective species proteins was validated through glycomic analysis. Comparative analyses also enabled the identification of two novel classes of ncRNAs specific to the dictyostelid lineage. High conservation of enzymes involved in cNMP metabolism and DIF production and degradation indicate the central role these signaling systems play in the social behavior of these amoebozoa. A detailed comparison of the variation between cohorts of genes with specific expression patterns between the two genomes demonstrate that genes involved in sociality evolve more rapidly, probably due to continuous adaptation and counter-adaptation.</p>
</sec>
<sec>
<st>
<p>Materials and methods</p>
</st>
<sec>
<st>
<p>Sequence and assembly</p>
</st>
<p>
<it>D. purpureum </it>was described in 1902 by Olive <abbrgrp>
<abbr bid="B94">94</abbr>
</abbrgrp>. <it>D. purpureum </it>isolate QSDP1 from the Queller and Strassmann laboratories at Rice University, and its axenic derivative DpAX1, were used in this study. DpAX1 was selected from QSDP1 for the ability to grow axenically, in defined liquid media, by culturing in plastic Petri dishes containing HL5 medium supplemented with 10% fetal bovine serum <abbrgrp>
<abbr bid="B95">95</abbr>
</abbrgrp>.</p>
<p>QSDP1 was used for EST production and sequencing. Cells were grown in association with <it>Klebsiella pneumoniae</it>, harvested and developed on nitrocellulose filters as described <abbrgrp>
<abbr bid="B95">95</abbr>
</abbrgrp>. RNA samples were prepared from developing cells at 0, 6, 12, and 18 hours <abbrgrp>
<abbr bid="B45">45</abbr>
</abbrgrp>. Two cDNA libraries were prepared from each of these four RNA samples and a total of 14,949 validated EST clones were sequenced from them. Briefly, polyA-selected RNA was reverse transcribed with superscript reverse transcriptase III (Invitrogen, Carlsbad, CA, USA) using dT primer (5' GACTAGTTCTAGATCGCGAG CGGCCGCCCTTTTTTTTTTTTTTTVN-3'). cDNA was synthesized with <it>Escherichia coli </it>DNA polymerase I, <it>E. coli </it>DNA ligase, and <it>E. coli </it>RNaseH. The DNA ends were repaired with T4 DNA polymerase. SalI adapters (5'-TCGACCCACGCGTCCG-3' and 5'-P0<sub>4</sub>-CGGACGCGTGGG-3') were ligated to cDNA and the product was digested with NotI. The cDNA digestion products were gel purified and directionally ligated into SalI- and NotI-digested pCMVsport6 and transformed into ElectroMAX, T1 DH10B <it>E. coli </it>cells (Invitrogen). Plasmid DNA was amplified by a rolling circle method (Templiphi, GE Healthcare, Piscataway, NJ, USA) and purified. The insert of each clone was sequenced from both ends with primers complementary to flanking vector sequences using Big Dye terminator chemistry and resolved by an ABI 3730 sequenator (ABI, Foster City, CA, USA).</p>
<p>To prepare high quality genomic DNA, DpAX1 cells were grown in shaking cultures in HL5 medium, and DNA was prepared from isolated nuclei by cesium chloride equilibrium density gradients. Genomic libraries were constructed by shearing genomic DNA with a Hydroshear (Genomic Solutions Inc., Ann Arbor, MI, USA) to create 6- to 10-kb fragments. The DNA fragments were size selected, purified, blunt-end repaired (End-It Kit, Epicentre Biotechnologies Madison, WI, USA) and ligated into a pMCL200 vector. The ligation product was purified and precipitated, and then transformed into ElectroMax DH10B competent cells (Invitrogen). The percentage of no-insert clones in the library was assessed by colony PCR, using primers flanking the cloning site (Expand long Template PCR system, Roche Applied Science, Indianapolis, IND, USA). Genomic DNA libraries with average insert sizes of 2.3 to 3.0 kb and 3 to 4 kb were produced by similar methods.</p>
<p>Primary sequence data were derived from whole-genome shotgun sequencing of the three plasmid libraries <abbrgrp>
<abbr bid="B96">96</abbr>
</abbrgrp>. The reads were screened for vector sequence with cross_match <abbrgrp>
<abbr bid="B97">97</abbr>
</abbrgrp> and trimmed for vector and low quality sequences. Reads shorter than 100 bases after trimming were excluded from the assembly. The trimmed read sequence data were assembled with release 1.0.3 of Jazz, a whole genome shotgun assembler <abbrgrp>
<abbr bid="B98">98</abbr>
</abbrgrp>. The assembly was next filtered for redundant scaffolds that matched larger scaffolds (&lt;5 kb length where &gt;80% matched a scaffold of &gt;5 kb length). Finally, scaffolds that showed homology to prokaryotic and non-cellular contaminants (viroids and viruses) were identified and removed. The filtered assembly contains 799 scaffolds, comprising 33.0 Mb, with an estimated sequence coverage of 8.41 &#215; (Additional file <supplr sid="S1">1</supplr>). The data were deposited in GenBank under project ID 30991 [GenBank:<ext-link ext-link-id="ADID00000000" ext-link-type="gen">ADID00000000</ext-link>].</p>
</sec>
<sec>
<st>
<p>The JGI genome annotation pipeline</p>
</st>
<p>For genome annotation we use the JGI annotation pipeline, which combines several gene prediction, annotation and analysis tools. First, the genome assembly is masked using RepeatMasker and a custom repeat library. Next, available ESTs and full-length cDNAs are clustered and aligned to the scaffolds with BLAT. Model organism protein sequences from the non-redundant set of proteins from the National Center for Biotechnology Information (GenBank) are aligned to the scaffolds with BLASTX <abbrgrp>
<abbr bid="B22">22</abbr>
</abbrgrp>. Gene models and associated transcripts/proteins are predicted or mapped using (i) data from putative full-length cDNAs derived from available mRNA, ESTs and EST clusters, (ii) homology-based methods Genewise and Fgenesh+, and (iii) <it>ab initio </it>method Fgenesh trained on putative full-length genes (see above), manually curated genes (if available), and reliable homology-based models. Additional gene models generated externally with other gene predictors trained for a particular genome can be added as well. The clustered ESTs/cDNAs are used to extend and correct predicted gene models where the exons overlap and splice junctions are not consistent in comparing EST sequences to gene models. This often adds 5' and/or 3' UTRs to the models. With gene structure in place, function is assigned to models based on Smith-Waterman homology to annotated genes from nr, KEGG, and KOG databases. InterproScan is used to identify predicted domains and the Gene Ontology is used to identify function and/or subcellular location. SignalP is used to assist with identification of secreted proteins. Since multiple models with overlapping sequences are generated for each locus, a single model is chosen to produce a non-redundant set of genes. Model selection is based on homology to known proteins from other organisms, EST support, as well as protein and transcript completeness (that is, inclusion of 5' methionine, 3' stop codon, and UTRs). This automatically generated set was further refined by manual curation and submitted to GenBank. Whole genome analysis is performed on the non-redundant set of gene models or a snapshot of a manually curated gene catalog assuming the latter includes significant number of changes compared to the automatically generated non-redundant set.</p>
</sec>
</sec>
<sec>
<st>
<p>Abbreviations</p>
</st>
<p>ABC: ATP-binding cassette; ADF: actin-depolymerizing factor; bp: base pair; bZIP: basic leucine zipper; cAR: cAMP receptor; CBD: carbohydrate binding domain; CBM: carbohydrate binding module; CH: calponin homology; cNMP: cyclic nucleoside monophosphate; DIF: differentiation-inducing factor; DUSE: <it>Dictyostelium </it>upstream sequence element; EST: expressed sequence tag; GPCR: G-protein coupled receptor; HGT: horizontal gene transfer; ncRNA: non-coding RNA; NSBR: non self-binding region; PDE: phosphodiesterase; PKA: cAMP dependent protein kinase; PKS: polyketide synthase; UTR: untranslated region.</p>
</sec>
<sec>
<st>
<p>Competing interests</p>
</st>
<p>The authors declare that they have no competing interests.</p>
</sec>
<sec>
<st>
<p>Authors' contributions</p>
</st>
<p>MK-K and GS derived the DpAx1 strain and purified the nucleic acids used in the project; Alan K, ED, HT, KB, EL, HS, DB, JS, and AS produced the primary DNA sequence, genome assembly, and gene annotation within the JGI pipeline; PF, PG, SB, YB and RLC carried out annotation and data accessibility at dictyBase; CA, MMB, XT, WS, AP, CLF, HvdW EH, CMW, WFL, GS, CD, PMC, TS, ME, PS, RRK, BH, LE, FR, and GS were involved in the analysis of the data and drafted sections of the paper; AP carried out the ortholog and paralog predictions; WS annotated the non-coding RNAs; NHP carried out the phylogeny and synteny analyses; CLF, HvdW, PMC, BH, and CMW carried out the glycoprotein analyses; JES, DCQ, RS, Adam K, and IVG provided overall project management; and Adam K assembled and edited the manuscript.</p>
</sec>
</bdy><bm>
<ack>
<sec>
<st>
<p>Acknowledgements</p>
</st>
<p>This work was performed under the auspices of the US Department of Energy's Office of Science, Biological and Environmental Research Program and the University of California, Lawrence Berkeley National Laboratory under contract No. DE-AC02-05CH11231, Lawrence Livermore National Laboratory under Contract No. DE-AC52-07NA27344, Los Alamos National Laboratory under contract No. DE-AC02-06NA25396. The annotation effort was supported by grants HD39691 (A Kuspa, GS, and RS), GM64426 (RLC), HG0022 (RLC) and GM84383 (CMW) from the National Institute of Health, and by grants EF-0626963 and DEB-0918931 (JES and DCQ) from the National Science Foundation. AP was supported by a fellowship from the Keck Center for Interdisciplinary Bioscience Training of the Gulf Coast Consortia (NIH Grants 1 T90 DA022885 and 1 R90 DA023418).</p>
</sec>
</ack>
<refgrp><bibl id="B1"><title><p>The genome of the social amoeba <it>Dictyostelium discoideum</it>.</p></title><aug><au><snm>Eichinger</snm><fnm>L</fnm></au><au><snm>Pachebat</snm><fnm>JA</fnm></au><au><snm>Gl&#246;ckner</snm><fnm>G</fnm></au><au><snm>Rajandream</snm><fnm>MA</fnm></au><au><snm>Sucgang</snm><fnm>R</fnm></au><au><snm>Berriman</snm><fnm>M</fnm></au><au><snm>Song</snm><fnm>J</fnm></au><au><snm>Olsen</snm><fnm>R</fnm></au><au><snm>Szafranski</snm><fnm>K</fnm></au><au><snm>Xu</snm><fnm>Q</fnm></au><au><snm>Tunggal</snm><fnm>B</fnm></au><au><snm>Kummerfeld</snm><fnm>S</fnm></au><au><snm>Madera</snm><fnm>M</fnm></au><au><snm>Konfortov</snm><fnm>BA</fnm></au><au><snm>Rivero</snm><fnm>F</fnm></au><au><snm>Bankier</snm><fnm>AT</fnm></au><au><snm>Lehmann</snm><fnm>R</fnm></au><au><snm>Hamlin</snm><fnm>N</fnm></au><au><snm>Davies</snm><fnm>R</fnm></au><au><snm>Gaudet</snm><fnm>P</fnm></au><au><snm>Fey</snm><fnm>P</fnm></au><au><snm>Pilcher</snm><fnm>K</fnm></au><au><snm>Chen</snm><fnm>G</fnm></au><au><snm>Saunders</snm><fnm>D</fnm></au><au><snm>Sodergren</snm><fnm>E</fnm></au><au><snm>Davis</snm><fnm>P</fnm></au><au><snm>Kerhornou</snm><fnm>A</fnm></au><au><snm>Nie</snm><fnm>X</fnm></au><au><snm>Hall</snm><fnm>N</fnm></au><au><snm>Anjard</snm><fnm>C</fnm></au><etal/></aug><source>Nature</source><pubdate>2005</pubdate><volume>435</volume><fpage>43</fpage><lpage>57</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/nature03481</pubid><pubid idtype="pmcid">1352341</pubid><pubid idtype="pmpid">15875012</pubid></pubidlist></xrefbib></bibl><bibl id="B2"><title><p>A revised six-kingdom system of life.</p></title><aug><au><snm>Cavalier-Smith</snm><fnm>T</fnm></au></aug><source>Biol Rev Camb Philos Soc</source><pubdate>1998</pubdate><volume>73</volume><fpage>203</fpage><lpage>266</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1017/S0006323198005167</pubid><pubid idtype="pmpid" link="fulltext">9809012</pubid></pubidlist></xrefbib></bibl><bibl id="B3"><title><p>The analysis of 100 genes supports the grouping of three highly divergent amoebae: <it>Dictyostelium</it>, Entamoeba, and Mastigamoeba.</p></title><aug><au><snm>Bapteste</snm><fnm>E</fnm></au><au><snm>Brinkmann</snm><fnm>H</fnm></au><au><snm>Lee</snm><fnm>JA</fnm></au><au><snm>Moore</snm><fnm>DV</fnm></au><au><snm>Sensen</snm><fnm>CW</fnm></au><au><snm>Gordon</snm><fnm>P</fnm></au><au><snm>Durufle</snm><fnm>L</fnm></au><au><snm>Gaasterland</snm><fnm>T</fnm></au><au><snm>Lopez</snm><fnm>P</fnm></au><au><snm>Muller</snm><fnm>M</fnm></au><au><snm>Philippe</snm><fnm>H</fnm></au></aug><source>Proc Natl Acad Sci USA</source><pubdate>2002</pubdate><volume>99</volume><fpage>1414</fpage><lpage>1419</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1073/pnas.032662799</pubid><pubid idtype="pmcid">122205</pubid><pubid idtype="pmpid">11830664</pubid></pubidlist></xrefbib></bibl><bibl id="B4"><title><p>Higher-order phylogeny of plasmodial slime molds (Myxogastria) based on elongation factor 1-A and small subunit rRNA gene sequences.</p></title><aug><au><snm>Fiore-Donno</snm><fnm>AM</fnm></au><au><snm>Berney</snm><fnm>C</fnm></au><au><snm>Pawlowski</snm><fnm>J</fnm></au><au><snm>Baldauf</snm><fnm>SL</fnm></au></aug><source>J Eukaryot Microbiol</source><pubdate>2005</pubdate><volume>52</volume><fpage>201</fpage><lpage>210</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1111/j.1550-7408.2005.00032.x</pubid><pubid idtype="pmpid" link="fulltext">15926995</pubid></pubidlist></xrefbib></bibl><bibl id="B5"><title><p>Evolutionary position of breviate amoebae and the primary eukaryote divergence.</p></title><aug><au><snm>Minge</snm><fnm>MA</fnm></au><au><snm>Silberman</snm><fnm>JD</fnm></au><au><snm>Orr</snm><fnm>RJ</fnm></au><au><snm>Cavalier-Smith</snm><fnm>T</fnm></au><au><snm>Shalchian-Tabrizi</snm><fnm>K</fnm></au><au><snm>Burki</snm><fnm>F</fnm></au><au><snm>Skjaeveland</snm><fnm>A</fnm></au><au><snm>Jakobsen</snm><fnm>KS</fnm></au></aug><source>Proc Biol Sci</source><pubdate>2009</pubdate><volume>276</volume><fpage>597</fpage><lpage>604</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1098/rspb.2008.1358</pubid><pubid idtype="pmcid">2660946</pubid><pubid idtype="pmpid">19004754</pubid></pubidlist></xrefbib></bibl><bibl id="B6"><title><p>Deep phylogeny and evolution of slime moulds (Mycetozoa).</p></title><aug><au><snm>Fiore-Donno</snm><fnm>AM</fnm></au><au><snm>Nikolaev</snm><fnm>SI</fnm></au><au><snm>Nelson</snm><fnm>M</fnm></au><au><snm>Pawlowski</snm><fnm>J</fnm></au><au><snm>Cavalier-Smith</snm><fnm>T</fnm></au><au><snm>Baldauf</snm><fnm>SL</fnm></au></aug><source>Protist</source><pubdate>2010</pubdate><volume>161</volume><fpage>55</fpage><lpage>70</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1016/j.protis.2009.05.002</pubid><pubid idtype="pmpid" link="fulltext">19656720</pubid></pubidlist></xrefbib></bibl><bibl id="B7"><title><p>Molecular phylogeny and evolution of morphology in the social amoebas.</p></title><aug><au><snm>Schaap</snm><fnm>P</fnm></au><au><snm>Winckler</snm><fnm>T</fnm></au><au><snm>Nelson</snm><fnm>M</fnm></au><au><snm>Alvarez-Curto</snm><fnm>E</fnm></au><au><snm>Elgie</snm><fnm>B</fnm></au><au><snm>Hagiwara</snm><fnm>H</fnm></au><au><snm>Cavender</snm><fnm>J</fnm></au><au><snm>Milano-Curto</snm><fnm>A</fnm></au><au><snm>Rozen</snm><fnm>DE</fnm></au><au><snm>Dingermann</snm><fnm>T</fnm></au><au><snm>Mutzel</snm><fnm>R</fnm></au><au><snm>Baldauf</snm><fnm>SL</fnm></au></aug><source>Science</source><pubdate>2006</pubdate><volume>314</volume><fpage>661</fpage><lpage>663</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1126/science.1130670</pubid><pubid idtype="pmcid">2173941</pubid><pubid idtype="pmpid">17068267</pubid></pubidlist></xrefbib></bibl><bibl id="B8"><aug><au><snm>Raper</snm><fnm>KB</fnm></au></aug><source>The Dictyostelids</source><publisher>Princeton, NJ: Princeton University Press</publisher><pubdate>1984</pubdate></bibl><bibl id="B9"><title><p>Interspecific mixtures in the Dictyosteliaceae.</p></title><aug><au><snm>Raper</snm><fnm>KB</fnm></au><au><snm>Thom</snm><fnm>C</fnm></au></aug><source>Am J Bot</source><pubdate>1941</pubdate><volume>28</volume><fpage>69</fpage><lpage>78</lpage><xrefbib><pubid idtype="doi">10.2307/2437063</pubid></xrefbib></bibl><bibl id="B10"><title><p>Social evolution: kin preference in a social microbe.</p></title><aug><au><snm>Mehdiabadi</snm><fnm>NJ</fnm></au><au><snm>Jack</snm><fnm>CN</fnm></au><au><snm>Farnham</snm><fnm>TT</fnm></au><au><snm>Platt</snm><fnm>TG</fnm></au><au><snm>Kalla</snm><fnm>SE</fnm></au><au><snm>Shaulsky</snm><fnm>G</fnm></au><au><snm>Queller</snm><fnm>DC</fnm></au><au><snm>Strassmann</snm><fnm>JE</fnm></au></aug><source>Nature</source><pubdate>2006</pubdate><volume>442</volume><fpage>881</fpage><lpage>882</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/442881a</pubid><pubid idtype="pmpid" link="fulltext">16929288</pubid></pubidlist></xrefbib></bibl><bibl id="B11"><title><p>Kin discrimination increases with genetic distance in a social amoeba.</p></title><aug><au><snm>Ostrowski</snm><fnm>EA</fnm></au><au><snm>Katoh</snm><fnm>M</fnm></au><au><snm>Shaulsky</snm><fnm>G</fnm></au><au><snm>Queller</snm><fnm>DC</fnm></au><au><snm>Strassmann</snm><fnm>JE</fnm></au></aug><source>PLoS Biol</source><pubdate>2008</pubdate><volume>6</volume><fpage>e287</fpage><xrefbib><pubidlist><pubid idtype="doi">10.1371/journal.pbio.0060287</pubid><pubid idtype="pmcid">2586364</pubid><pubid idtype="pmpid">19067487</pubid></pubidlist></xrefbib></bibl><bibl id="B12"><aug><au><snm>Loomis</snm><fnm>WF</fnm></au><au><snm>Kuspa</snm><fnm>A</fnm></au></aug><source>Dictyostelium Genomics</source><publisher>Norfolk: Horizon Bioscience</publisher><edition>1</edition><pubdate>2005</pubdate></bibl><bibl id="B13"><title><p>JGI Dictyostelium purpureum genome portal.</p></title><url>http://genome.jgi-psf.org/Dicpu1/Dicpu1.home.html</url></bibl><bibl id="B14"><title><p>dictyBase.</p></title><url>http://dictybase.org/</url></bibl><bibl id="B15"><title><p>Conserved developmental transcriptomes in evolutionary divergent species.</p></title><aug><au><snm>Parikh</snm><fnm>A</fnm></au><au><snm>Miranda</snm><fnm>ER</fnm></au><au><snm>Katoh-Kurasawa</snm><fnm>M</fnm></au><au><snm>Fuller</snm><fnm>D</fnm></au><au><snm>Rot</snm><fnm>G</fnm></au><au><snm>Zagar</snm><fnm>L</fnm></au><au><snm>Curk</snm><fnm>T</fnm></au><au><snm>Sucgang</snm><fnm>R</fnm></au><au><snm>Chen</snm><fnm>R</fnm></au><au><snm>Zupan</snm><fnm>B</fnm></au><au><snm>Loomis</snm><fnm>WF</fnm></au><au><snm>Kuspa</snm><fnm>A</fnm></au><au><snm>Shaulsky</snm><fnm>G</fnm></au></aug><source>Genome Biol</source><pubdate>2010</pubdate><volume>11</volume><fpage>R35</fpage><xrefbib><pubidlist><pubid idtype="doi">10.1186/gb-2010-11-3-r35</pubid><pubid idtype="pmcid">2864575</pubid><pubid idtype="pmpid">20236529</pubid></pubidlist></xrefbib></bibl><bibl id="B16"><title><p>Evolutionary dynamics of microsatellite DNA.</p></title><aug><au><snm>Schlotterer</snm><fnm>C</fnm></au></aug><source>Chromosoma</source><pubdate>2000</pubdate><volume>109</volume><fpage>365</fpage><lpage>371</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1007/s004120000089</pubid><pubid idtype="pmpid" link="fulltext">11072791</pubid></pubidlist></xrefbib></bibl><bibl id="B17"><title><p>Trinucleotide repeats and long homopeptides in genes and proteins associated with nervous system disease and development.</p></title><aug><au><snm>Karlin</snm><fnm>S</fnm></au><au><snm>Burge</snm><fnm>C</fnm></au></aug><source>Proc Natl Acad Sci USA</source><pubdate>1996</pubdate><volume>93</volume><fpage>1560</fpage><lpage>1565</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1073/pnas.93.4.1560</pubid><pubid idtype="pmcid">39980</pubid><pubid idtype="pmpid">8643671</pubid></pubidlist></xrefbib></bibl><bibl id="B18"><title><p>Diseases of unstable repeat expansion: mechanisms and common principles.</p></title><aug><au><snm>Gatchel</snm><fnm>JR</fnm></au><au><snm>Zoghbi</snm><fnm>HY</fnm></au></aug><source>Nat Rev Genet</source><pubdate>2005</pubdate><volume>6</volume><fpage>743</fpage><lpage>755</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/nrg1691</pubid><pubid idtype="pmpid" link="fulltext">16205714</pubid></pubidlist></xrefbib></bibl><bibl id="B19"><title><p>Genome nucleotide composition shapes variation in simple sequence repeats.</p></title><aug><au><snm>Tian</snm><fnm>X</fnm></au><au><snm>Strassmann</snm><fnm>JE</fnm></au><au><snm>Queller</snm><fnm>DC</fnm></au></aug><source>Mol Biol Evol</source><pubdate>2010</pubdate><volume>28</volume><fpage>899</fpage><lpage>909</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/molbev/msq266</pubid><pubid idtype="pmpid" link="fulltext">20943830</pubid></pubidlist></xrefbib></bibl><bibl id="B20"><title><p>Comparing the <it>Dictyostelium </it>and Entamoeba genomes reveals an ancient split in the Conosa lineage.</p></title><aug><au><snm>Song</snm><fnm>J</fnm></au><au><snm>Xu</snm><fnm>Q</fnm></au><au><snm>Olsen</snm><fnm>R</fnm></au><au><snm>Loomis</snm><fnm>W</fnm></au><au><snm>Shaulsky</snm><fnm>G</fnm></au><au><snm>Kuspa</snm><fnm>A</fnm></au><au><snm>Sucgang</snm><fnm>R</fnm></au></aug><source>PLoS Comput Biol</source><pubdate>2005</pubdate><volume>1</volume><fpage>e71</fpage><xrefbib><pubidlist><pubid idtype="doi">10.1371/journal.pcbi.0010071</pubid><pubid idtype="pmcid">1314882</pubid><pubid idtype="pmpid">16362072</pubid></pubidlist></xrefbib></bibl><bibl id="B21"><title><p>An alternative flavin-dependent mechanism for thymidylate synthesis.</p></title><aug><au><snm>Myllykallio</snm><fnm>H</fnm></au><au><snm>Lipowski</snm><fnm>G</fnm></au><au><snm>Leduc</snm><fnm>D</fnm></au><au><snm>Filee</snm><fnm>J</fnm></au><au><snm>Forterre</snm><fnm>P</fnm></au><au><snm>Liebl</snm><fnm>U</fnm></au></aug><source>Science</source><pubdate>2002</pubdate><volume>297</volume><fpage>105</fpage><lpage>107</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1126/science.1072113</pubid><pubid idtype="pmpid" link="fulltext">12029065</pubid></pubidlist></xrefbib></bibl><bibl id="B22"><title><p>NCBI.</p></title><url>http://www.ncbi.nlm.nih.gov/</url></bibl><bibl id="B23"><title><p>Cytokinins induce sporulation in <it>Dictyostelium</it>.</p></title><aug><au><snm>Anjard</snm><fnm>C</fnm></au><au><snm>Loomis</snm><fnm>WF</fnm></au></aug><source>Development</source><pubdate>2008</pubdate><volume>135</volume><fpage>819</fpage><lpage>827</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1242/dev.018051</pubid><pubid idtype="pmpid" link="fulltext">18216168</pubid></pubidlist></xrefbib></bibl><bibl id="B24"><title><p>Identification of a penicillin-sensitive carboxypeptidase in the cellular slime mold <it>Dictyostelium discoideum</it>.</p></title><aug><au><snm>Yasukawa</snm><fnm>H</fnm></au><au><snm>Kuroita</snm><fnm>T</fnm></au><au><snm>Tamura</snm><fnm>K</fnm></au><au><snm>Yamaguchi</snm><fnm>K</fnm></au></aug><source>Biol Pharm Bull</source><pubdate>2003</pubdate><volume>26</volume><fpage>1018</fpage><lpage>1020</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1248/bpb.26.1018</pubid><pubid idtype="pmpid" link="fulltext">12843630</pubid></pubidlist></xrefbib></bibl><bibl id="B25"><title><p>Polyphosphate kinase 1, a conserved bacterial enzyme, in a eukaryote, <it>Dictyostelium discoideum</it>, with a role in cytokinesis.</p></title><aug><au><snm>Zhang</snm><fnm>H</fnm></au><au><snm>Gomez-Garcia</snm><fnm>MR</fnm></au><au><snm>Shi</snm><fnm>X</fnm></au><au><snm>Rao</snm><fnm>NN</fnm></au><au><snm>Kornberg</snm><fnm>A</fnm></au></aug><source>Proc Natl Acad Sci USA</source><pubdate>2007</pubdate><volume>104</volume><fpage>16486</fpage><lpage>16491</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1073/pnas.0706847104</pubid><pubid idtype="pmcid">2034253</pubid><pubid idtype="pmpid">17940044</pubid></pubidlist></xrefbib></bibl><bibl id="B26"><title><p>Disruption of the gene encoding the p34/31 polypeptides affects growth and development of <it>Dictyostelium discoideum</it>.</p></title><aug><au><snm>Bain</snm><fnm>G</fnm></au><au><snm>Tsang</snm><fnm>A</fnm></au></aug><source>Mol Gen Genet</source><pubdate>1991</pubdate><volume>226</volume><fpage>59</fpage><lpage>64</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1007/BF00273587</pubid><pubid idtype="pmpid">1851956</pubid></pubidlist></xrefbib></bibl><bibl id="B27"><title><p>Identification of novel centrosomal proteins in <it>Dictyostelium discoideum </it>by comparative proteomic approaches.</p></title><aug><au><snm>Reinders</snm><fnm>Y</fnm></au><au><snm>Schulz</snm><fnm>I</fnm></au><au><snm>Graf</snm><fnm>R</fnm></au><au><snm>Sickmann</snm><fnm>A</fnm></au></aug><source>J Proteome Res</source><pubdate>2006</pubdate><volume>5</volume><fpage>589</fpage><lpage>598</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1021/pr050350q</pubid><pubid idtype="pmpid" link="fulltext">16512674</pubid></pubidlist></xrefbib></bibl><bibl id="B28"><title><p>Sea anemone genome reveals ancestral eumetazoan gene repertoire and genomic organization.</p></title><aug><au><snm>Putnam</snm><fnm>NH</fnm></au><au><snm>Srivastava</snm><fnm>M</fnm></au><au><snm>Hellsten</snm><fnm>U</fnm></au><au><snm>Dirks</snm><fnm>B</fnm></au><au><snm>Chapman</snm><fnm>J</fnm></au><au><snm>Salamov</snm><fnm>A</fnm></au><au><snm>Terry</snm><fnm>A</fnm></au><au><snm>Shapiro</snm><fnm>H</fnm></au><au><snm>Lindquist</snm><fnm>E</fnm></au><au><snm>Kapitonov</snm><fnm>VV</fnm></au><au><snm>Jurka</snm><fnm>J</fnm></au><au><snm>Genikhovich</snm><fnm>G</fnm></au><au><snm>Grigoriev</snm><fnm>IV</fnm></au><au><snm>Lucas</snm><fnm>SM</fnm></au><au><snm>Steele</snm><fnm>RE</fnm></au><au><snm>Finnerty</snm><fnm>JR</fnm></au><au><snm>Technau</snm><fnm>U</fnm></au><au><snm>Martindale</snm><fnm>MQ</fnm></au><au><snm>Rokhsar</snm><fnm>DS</fnm></au></aug><source>Science</source><pubdate>2007</pubdate><volume>317</volume><fpage>86</fpage><lpage>94</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1126/science.1139158</pubid><pubid idtype="pmpid" link="fulltext">17615350</pubid></pubidlist></xrefbib></bibl><bibl id="B29"><title><p>Treasure hunt in an amoeba: non-coding RNAs in <it>Dictyostelium discoideum</it>.</p></title><aug><au><snm>Hinas</snm><fnm>A</fnm></au><au><snm>Soderbom</snm><fnm>F</fnm></au></aug><source>Curr Genet</source><pubdate>2007</pubdate><volume>51</volume><fpage>141</fpage><lpage>159</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1007/s00294-006-0112-z</pubid><pubid idtype="pmpid" link="fulltext">17171561</pubid></pubidlist></xrefbib></bibl><bibl id="B30"><title><p>Novel non-coding RNAs in <it>Dictyostelium discoideum </it>and their expression during development.</p></title><aug><au><snm>Aspegren</snm><fnm>A</fnm></au><au><snm>Hinas</snm><fnm>A</fnm></au><au><snm>Larsson</snm><fnm>P</fnm></au><au><snm>Larsson</snm><fnm>A</fnm></au><au><snm>S&#246;derbom</snm><fnm>F</fnm></au></aug><source>Nucleic Acids Res</source><pubdate>2004</pubdate><volume>32</volume><fpage>4646</fpage><lpage>4656</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/nar/gkh804</pubid><pubid idtype="pmcid">516072</pubid><pubid idtype="pmpid">15333696</pubid></pubidlist></xrefbib></bibl><bibl id="B31"><title><p>Identification of the major spliceosomal RNAs in <it>Dictyostelium discoideum </it>reveals developmentally regulated U2 variants and polyadenylated snRNAs.</p></title><aug><au><snm>Hinas</snm><fnm>A</fnm></au><au><snm>Larsson</snm><fnm>P</fnm></au><au><snm>Avesson</snm><fnm>L</fnm></au><au><snm>Kirsebom</snm><fnm>LA</fnm></au><au><snm>Virtanen</snm><fnm>A</fnm></au><au><snm>Soderbom</snm><fnm>F</fnm></au></aug><source>Eukaryot Cell</source><pubdate>2006</pubdate><volume>5</volume><fpage>924</fpage><lpage>934</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1128/EC.00065-06</pubid><pubid idtype="pmcid">1489274</pubid><pubid idtype="pmpid">16757740</pubid></pubidlist></xrefbib></bibl><bibl id="B32"><title><p>Novel acyl alpha-pyronoids, dictyopyrone A, B, and C, from <it>Dictyostelium </it>cellular slime molds.</p></title><aug><au><snm>Takaya</snm><fnm>Y</fnm></au><au><snm>Kikuchi</snm><fnm>H</fnm></au><au><snm>Terui</snm><fnm>Y</fnm></au><au><snm>Komiya</snm><fnm>J</fnm></au><au><snm>Furukawa</snm><fnm>KI</fnm></au><au><snm>Seya</snm><fnm>K</fnm></au><au><snm>Motomura</snm><fnm>S</fnm></au><au><snm>Ito</snm><fnm>A</fnm></au><au><snm>Oshima</snm><fnm>Y</fnm></au></aug><source>J Org Chem</source><pubdate>2000</pubdate><volume>65</volume><fpage>985</fpage><lpage>989</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1021/jo991338i</pubid><pubid idtype="pmpid" link="fulltext">10814044</pubid></pubidlist></xrefbib></bibl><bibl id="B33"><title><p>Isolation and synthesis of a new aromatic compound, brefelamide, from dictyostelium cellular slime molds and its inhibitory effect on the proliferation of astrocytoma cells.</p></title><aug><au><snm>Kikuchi</snm><fnm>H</fnm></au><au><snm>Saito</snm><fnm>Y</fnm></au><au><snm>Sekiya</snm><fnm>J</fnm></au><au><snm>Okano</snm><fnm>Y</fnm></au><au><snm>Saito</snm><fnm>M</fnm></au><au><snm>Nakahata</snm><fnm>N</fnm></au><au><snm>Kubohara</snm><fnm>Y</fnm></au><au><snm>Oshima</snm><fnm>Y</fnm></au></aug><source>J Org Chem</source><pubdate>2005</pubdate><volume>70</volume><fpage>8854</fpage><lpage>8858</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1021/jo051352x</pubid><pubid idtype="pmpid" link="fulltext">16238318</pubid></pubidlist></xrefbib></bibl><bibl id="B34"><title><p>Polyketide synthase genes and the natural products potential of <it>Dictyostelium discoideum</it>.</p></title><aug><au><snm>Zucko</snm><fnm>J</fnm></au><au><snm>Skunca</snm><fnm>N</fnm></au><au><snm>Curk</snm><fnm>T</fnm></au><au><snm>Zupan</snm><fnm>B</fnm></au><au><snm>Long</snm><fnm>PF</fnm></au><au><snm>Cullum</snm><fnm>J</fnm></au><au><snm>Kessin</snm><fnm>RH</fnm></au><au><snm>Hranueli</snm><fnm>D</fnm></au></aug><source>Bioinformatics</source><pubdate>2007</pubdate><volume>23</volume><fpage>2543</fpage><lpage>2549</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/bioinformatics/btm381</pubid><pubid idtype="pmpid" link="fulltext">17660200</pubid></pubidlist></xrefbib></bibl><bibl id="B35"><title><p>Dissecting the functional role of polyketide synthases in <it>Dictyostelium discoideum</it>: biosynthesis of the differentiation regulating factor 4-methyl-5-pentylbenzene-1,3-diol.</p></title><aug><au><snm>Ghosh</snm><fnm>R</fnm></au><au><snm>Chhabra</snm><fnm>A</fnm></au><au><snm>Phatale</snm><fnm>PA</fnm></au><au><snm>Samrat</snm><fnm>SK</fnm></au><au><snm>Sharma</snm><fnm>J</fnm></au><au><snm>Gosain</snm><fnm>A</fnm></au><au><snm>Mohanty</snm><fnm>D</fnm></au><au><snm>Saran</snm><fnm>S</fnm></au><au><snm>Gokhale</snm><fnm>RS</fnm></au></aug><source>J Biol Chem</source><pubdate>2008</pubdate><volume>283</volume><fpage>11348</fpage><lpage>11354</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1074/jbc.M709588200</pubid><pubid idtype="pmpid" link="fulltext">18252726</pubid></pubidlist></xrefbib></bibl><bibl id="B36"><title><p>Biosynthesis of <it>Dictyostelium discoideum </it>differentiation-inducing factor by a hybrid type I fatty acid-type III polyketide synthase.</p></title><aug><au><snm>Austin</snm><fnm>MB</fnm></au><au><snm>Saito</snm><fnm>T</fnm></au><au><snm>Bowman</snm><fnm>ME</fnm></au><au><snm>Haydock</snm><fnm>S</fnm></au><au><snm>Kato</snm><fnm>A</fnm></au><au><snm>Moore</snm><fnm>BS</fnm></au><au><snm>Kay</snm><fnm>RR</fnm></au><au><snm>Noel</snm><fnm>JP</fnm></au></aug><source>Nat Chem Biol</source><pubdate>2006</pubdate><volume>2</volume><fpage>494</fpage><lpage>502</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/nchembio811</pubid><pubid idtype="pmcid">2864586</pubid><pubid idtype="pmpid">16906151</pubid></pubidlist></xrefbib></bibl><bibl id="B37"><title><p>Chemical structure of the morphogen differentiation inducing factor from <it>Dictyostelium discoideum</it>.</p></title><aug><au><snm>Morris</snm><fnm>HR</fnm></au><au><snm>Taylor</snm><fnm>GW</fnm></au><au><snm>Masento</snm><fnm>MS</fnm></au><au><snm>Jermyn</snm><fnm>KA</fnm></au><au><snm>Kay</snm><fnm>RR</fnm></au></aug><source>Nature</source><pubdate>1987</pubdate><volume>328</volume><fpage>811</fpage><lpage>814</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/328811a0</pubid><pubid idtype="pmpid" link="fulltext">3627228</pubid></pubidlist></xrefbib></bibl><bibl id="B38"><title><p>Identification of new differentiation inducing factors from <it>Dictyostelium discoideum</it>.</p></title><aug><au><snm>Saito</snm><fnm>T</fnm></au><au><snm>Taylor</snm><fnm>GW</fnm></au><au><snm>Yang</snm><fnm>JC</fnm></au><au><snm>Neuhaus</snm><fnm>D</fnm></au><au><snm>Stetsenko</snm><fnm>D</fnm></au><au><snm>Kato</snm><fnm>A</fnm></au><au><snm>Kay</snm><fnm>RR</fnm></au></aug><source>Biochim Biophys Acta</source><pubdate>2006</pubdate><volume>1760</volume><fpage>754</fpage><lpage>761</lpage><xrefbib><pubid idtype="pmpid" link="fulltext">16545913</pubid></xrefbib></bibl><bibl id="B39"><title><p>Cell-fate choice in <it>Dictyostelium</it>: intrinsic biases modulate sensitivity to DIF signaling.</p></title><aug><au><snm>Thompson</snm><fnm>CR</fnm></au><au><snm>Kay</snm><fnm>RR</fnm></au></aug><source>Dev Biol</source><pubdate>2000</pubdate><volume>227</volume><fpage>56</fpage><lpage>64</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1006/dbio.2000.9877</pubid><pubid idtype="pmpid" link="fulltext">11076676</pubid></pubidlist></xrefbib></bibl><bibl id="B40"><title><p>Chlorine-containing compounds produced during <it>Dictyostelium </it>development - detection by labelling with Cl-36.</p></title><aug><au><snm>Kay</snm><fnm>RR</fnm></au><au><snm>Taylor</snm><fnm>GW</fnm></au><au><snm>Jermyn</snm><fnm>KA</fnm></au><au><snm>Traynor</snm><fnm>D</fnm></au></aug><source>Biochem J</source><pubdate>1992</pubdate><volume>281</volume><fpage>155</fpage><lpage>161</lpage><xrefbib><pubidlist><pubid idtype="pmcid">1130654</pubid><pubid idtype="pmpid">1731750</pubid></pubidlist></xrefbib></bibl><bibl id="B41"><title><p>Facultative cheater mutants reveal the genetic complexity of cooperation in social amoebae.</p></title><aug><au><snm>Santorelli</snm><fnm>LA</fnm></au><au><snm>Thompson</snm><fnm>CR</fnm></au><au><snm>Villegas</snm><fnm>E</fnm></au><au><snm>Svetz</snm><fnm>J</fnm></au><au><snm>Dinh</snm><fnm>C</fnm></au><au><snm>Parikh</snm><fnm>A</fnm></au><au><snm>Sucgang</snm><fnm>R</fnm></au><au><snm>Kuspa</snm><fnm>A</fnm></au><au><snm>Strassmann</snm><fnm>JE</fnm></au><au><snm>Queller</snm><fnm>DC</fnm></au><au><snm>Shaulsky</snm><fnm>G</fnm></au></aug><source>Nature</source><pubdate>2008</pubdate><volume>451</volume><fpage>1107</fpage><lpage>1110</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/nature06558</pubid><pubid idtype="pmpid" link="fulltext">18272966</pubid></pubidlist></xrefbib></bibl><bibl id="B42"><title><p>Natural products as sources of new drugs over the last 25 years.</p></title><aug><au><snm>Newman</snm><fnm>DJ</fnm></au><au><snm>Cragg</snm><fnm>GM</fnm></au></aug><source>J Nat Prod</source><pubdate>2007</pubdate><volume>70</volume><fpage>461</fpage><lpage>477</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1021/np068054v</pubid><pubid idtype="pmpid">17309302</pubid></pubidlist></xrefbib></bibl><bibl id="B43"><title><p>Evolutionary analyses of ABC transporters of <it>Dictyostelium discoideum</it>.</p></title><aug><au><snm>Anjard</snm><fnm>C</fnm></au><au><snm>Loomis</snm><fnm>WF</fnm></au></aug><source>Eukaryot Cell</source><pubdate>2002</pubdate><volume>1</volume><fpage>643</fpage><lpage>652</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1128/EC.1.4.643-652.2002</pubid><pubid idtype="pmcid">117992</pubid><pubid idtype="pmpid">12456012</pubid></pubidlist></xrefbib></bibl><bibl id="B44"><title><p>TagA, a putative serine protease/ABC transporter of <it>Dictyostelium </it>that is required for cell fate determination at the onset of development.</p></title><aug><au><snm>Good</snm><fnm>JR</fnm></au><au><snm>Cabral</snm><fnm>M</fnm></au><au><snm>Sharma</snm><fnm>S</fnm></au><au><snm>Yang</snm><fnm>J</fnm></au><au><snm>Van Driessche</snm><fnm>N</fnm></au><au><snm>Shaw</snm><fnm>CA</fnm></au><au><snm>Shaulsky</snm><fnm>G</fnm></au><au><snm>Kuspa</snm><fnm>A</fnm></au></aug><source>Development</source><pubdate>2003</pubdate><volume>130</volume><fpage>2953</fpage><lpage>2965</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1242/dev.00523</pubid><pubid idtype="pmpid" link="fulltext">12756178</pubid></pubidlist></xrefbib></bibl><bibl id="B45"><title><p>A multidrug resistance transporter serine protease gene is required for prestalk specialization in <it>Dictyostelium</it>.</p></title><aug><au><snm>Shaulsky</snm><fnm>G</fnm></au><au><snm>Kuspa</snm><fnm>A</fnm></au><au><snm>Loomis</snm><fnm>WF</fnm></au></aug><source>Genes Dev</source><pubdate>1995</pubdate><volume>9</volume><fpage>1111</fpage><lpage>1122</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1101/gad.9.9.1111</pubid><pubid idtype="pmpid" link="fulltext">7744252</pubid></pubidlist></xrefbib></bibl><bibl id="B46"><title><p>Peptide signaling during terminal differentiation of <it>Dictyostelium</it>.</p></title><aug><au><snm>Anjard</snm><fnm>C</fnm></au><au><snm>Loomis</snm><fnm>WF</fnm></au></aug><source>Proc Natl Acad Sci USA</source><pubdate>2005</pubdate><volume>102</volume><fpage>7607</fpage><lpage>7611</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1073/pnas.0501820102</pubid><pubid idtype="pmcid">1140433</pubid><pubid idtype="pmpid">15897458</pubid></pubidlist></xrefbib></bibl><bibl id="B47"><title><p>The dictyostelium kinome - analysis of the protein kinases from a simple model organism.</p></title><aug><au><snm>Goldberg</snm><fnm>JM</fnm></au><au><snm>Manning</snm><fnm>G</fnm></au><au><snm>Liu</snm><fnm>A</fnm></au><au><snm>Fey</snm><fnm>P</fnm></au><au><snm>Pilcher</snm><fnm>KE</fnm></au><au><snm>Xu</snm><fnm>Y</fnm></au><au><snm>Smith</snm><fnm>JL</fnm></au></aug><source>PLoS Genet</source><pubdate>2006</pubdate><volume>2</volume><fpage>e38</fpage><xrefbib><pubidlist><pubid idtype="doi">10.1371/journal.pgen.0020038</pubid><pubid idtype="pmcid">1420674</pubid><pubid idtype="pmpid">16596165</pubid></pubidlist></xrefbib></bibl><bibl id="B48"><title><p>An adenylyl cyclase that functions during late development of <it>Dictyostelium</it>.</p></title><aug><au><snm>Soderbom</snm><fnm>F</fnm></au><au><snm>Anjard</snm><fnm>C</fnm></au><au><snm>Iranfar</snm><fnm>N</fnm></au><au><snm>Fuller</snm><fnm>D</fnm></au><au><snm>Loomis</snm><fnm>WF</fnm></au></aug><source>Development</source><pubdate>1999</pubdate><volume>126</volume><fpage>5463</fpage><lpage>5471</lpage><xrefbib><pubid idtype="pmpid" link="fulltext">10556070</pubid></xrefbib></bibl><bibl id="B49"><title><p>Protein kinases share a common structural motif outside the conserved catalytic domain.</p></title><aug><au><snm>Veron</snm><fnm>M</fnm></au><au><snm>Radzio-Andzelm</snm><fnm>E</fnm></au><au><snm>Tsigelny</snm><fnm>I</fnm></au><au><snm>Taylor</snm><fnm>S</fnm></au></aug><source>Cell Mol Biol</source><pubdate>1994</pubdate><volume>40</volume><fpage>587</fpage><lpage>596</lpage><xrefbib><pubid idtype="pmpid">7981616</pubid></xrefbib></bibl><bibl id="B50"><title><p>A new family of transcription factors.</p></title><aug><au><snm>Yamada</snm><fnm>Y</fnm></au><au><snm>Wang</snm><fnm>HY</fnm></au><au><snm>Fukuzawa</snm><fnm>M</fnm></au><au><snm>Barton</snm><fnm>GJ</fnm></au><au><snm>Williams</snm><fnm>JG</fnm></au></aug><source>Development</source><pubdate>2008</pubdate><volume>135</volume><fpage>3093</fpage><lpage>3101</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1242/dev.026377</pubid><pubid idtype="pmpid" link="fulltext">18701541</pubid></pubidlist></xrefbib></bibl><bibl id="B51"><title><p>Sampling gene diversity across the supergroup Amoebozoa: large EST data sets from <it>Acanthamoeba castellanii</it>, <it>Hartmannella vermiformis</it>, <it>Physarum polycephalum</it>, <it>Hyperamoeba dachnaya </it>and <it>Hyperamoeba </it>sp.</p></title><aug><au><snm>Watkins</snm><fnm>RF</fnm></au><au><snm>Gray</snm><fnm>MW</fnm></au></aug><source>Protist</source><pubdate>2008</pubdate><volume>159</volume><fpage>269</fpage><lpage>281</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1016/j.protis.2007.12.001</pubid><pubid idtype="pmpid" link="fulltext">18276190</pubid></pubidlist></xrefbib></bibl><bibl id="B52"><title><p>The microfilament system of <it>Dictystelium discoideum</it>.</p></title><aug><au><snm>Rivero</snm><fnm>F</fnm></au><au><snm>Eichinger</snm><fnm>L</fnm></au></aug><source>Dictyostelium Genomics</source><publisher>Norfolk: Horizon Bioscience</publisher><editor>Loomis WF, Kuspa A</editor><pubdate>2005</pubdate><fpage>125</fpage><lpage>172</lpage></bibl><bibl id="B53"><title><p>Rho GTPase signaling in <it>Dictyostelium discoideum</it>: insights from the genome.</p></title><aug><au><snm>Vlahou</snm><fnm>G</fnm></au><au><snm>Rivero</snm><fnm>F</fnm></au></aug><source>Eur J Cell Biol</source><pubdate>2006</pubdate><volume>85</volume><fpage>947</fpage><lpage>959</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1016/j.ejcb.2006.04.011</pubid><pubid idtype="pmpid" link="fulltext">16762450</pubid></pubidlist></xrefbib></bibl><bibl id="B54"><title><p>Glycosyltransferase genomics in <it>Dictyostelium</it>.</p></title><aug><au><snm>West</snm><fnm>C</fnm></au><au><snm>van der Wel</snm><fnm>H</fnm></au><au><snm>Coutinho</snm><fnm>PM</fnm></au><au><snm>Henrissat</snm><fnm>B</fnm></au></aug><source>Dictyostelium Genomics</source><publisher>Norfolk: Horizon Bioscience</publisher><editor>Loomis WF, Kuspa A</editor><pubdate>2005</pubdate><fpage>235</fpage><lpage>264</lpage></bibl><bibl id="B55"><title><p>CAZy: Carbohydrate-Active enZYmes Database.</p></title><url>http://www.cazy.org/</url></bibl><bibl id="B56"><title><p>The Carbohydrate-Active EnZymes database (CAZy): an expert resource for Glycogenomics.</p></title><aug><au><snm>Cantarel</snm><fnm>BL</fnm></au><au><snm>Coutinho</snm><fnm>PM</fnm></au><au><snm>Rancurel</snm><fnm>C</fnm></au><au><snm>Bernard</snm><fnm>T</fnm></au><au><snm>Lombard</snm><fnm>V</fnm></au><au><snm>Henrissat</snm><fnm>B</fnm></au></aug><source>Nucleic Acids Res</source><pubdate>2009</pubdate><volume>37</volume><fpage>D233</fpage><lpage>238</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/nar/gkn663</pubid><pubid idtype="pmcid">2686590</pubid><pubid idtype="pmpid">18838391</pubid></pubidlist></xrefbib></bibl><bibl id="B57"><aug><au><snm>Freeze</snm><fnm>HH</fnm></au></aug><source>Dictyostelium discoideum Glycoproteins: Using a Model System for Organismic Glycobiology</source><publisher>Elsevier</publisher><pubdate>1998</pubdate></bibl><bibl id="B58"><title><p>The diversity of dolichol-linked precursors to Asn-linked glycans likely results from secondary loss of sets of glycosyltransferases.</p></title><aug><au><snm>Samuelson</snm><fnm>J</fnm></au><au><snm>Banerjee</snm><fnm>S</fnm></au><au><snm>Magnelli</snm><fnm>P</fnm></au><au><snm>Cui</snm><fnm>J</fnm></au><au><snm>Kelleher</snm><fnm>DJ</fnm></au><au><snm>Gilmore</snm><fnm>R</fnm></au><au><snm>Robbins</snm><fnm>PW</fnm></au></aug><source>Proc Natl Acad Sci USA</source><pubdate>2005</pubdate><volume>102</volume><fpage>1548</fpage><lpage>1553</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1073/pnas.0409460102</pubid><pubid idtype="pmcid">545090</pubid><pubid idtype="pmpid">15665075</pubid></pubidlist></xrefbib></bibl><bibl id="B59"><title><p>Glycopeptidome of a heavily N-glycosylated cell surface glycoprotein of <it>Dictyostelium </it>implicated in cell adhesion.</p></title><aug><au><snm>Feasley</snm><fnm>CL</fnm></au><au><snm>Johnson</snm><fnm>JM</fnm></au><au><snm>West</snm><fnm>CM</fnm></au><au><snm>Chia</snm><fnm>CP</fnm></au></aug><source>J Proteome Res</source><pubdate>2010</pubdate><volume>9</volume><fpage>3495</fpage><lpage>510</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1021/pr901195c</pubid><pubid idtype="pmpid" link="fulltext">20443635</pubid></pubidlist></xrefbib></bibl><bibl id="B60"><title><p>Development of <it>Dictyostelium discoideum </it>is associated with alteration of fucosylated N-glycan structures.</p></title><aug><au><snm>Schiller</snm><fnm>B</fnm></au><au><snm>Hykollari</snm><fnm>A</fnm></au><au><snm>Voglmeir</snm><fnm>J</fnm></au><au><snm>Poltl</snm><fnm>G</fnm></au><au><snm>Hummel</snm><fnm>K</fnm></au><au><snm>Razzazi-Fazeli</snm><fnm>E</fnm></au><au><snm>Geyer</snm><fnm>R</fnm></au><au><snm>Wilson</snm><fnm>IB</fnm></au></aug><source>Biochem J</source><pubdate>2009</pubdate><volume>423</volume><fpage>41</fpage><lpage>52</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1042/BJ20090786</pubid><pubid idtype="pmcid">2851138</pubid><pubid idtype="pmpid">19614564</pubid></pubidlist></xrefbib></bibl><bibl id="B61"><title><p>Evidence for differential cellular adhesion as the mechanism of sorting-out of various cellular slime mold species.</p></title><aug><au><snm>Sternfeld</snm><fnm>J</fnm></au></aug><source>J Embryol Exp Morph</source><pubdate>1979</pubdate><volume>53</volume><fpage>163</fpage><lpage>178</lpage><xrefbib><pubid idtype="pmpid">536686</pubid></xrefbib></bibl><bibl id="B62"><title><p>Initiation of mucin-type O-glycosylation in <it>Dictyostelium </it>is homologous to the corresponding step in animals and is important for spore coat function.</p></title><aug><au><snm>Wang</snm><fnm>F</fnm></au><au><snm>Metcalf</snm><fnm>T</fnm></au><au><snm>van der Wel</snm><fnm>H</fnm></au><au><snm>West</snm><fnm>CM</fnm></au></aug><source>J Biol Chem</source><pubdate>2003</pubdate><volume>278</volume><fpage>51395</fpage><lpage>51407</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1074/jbc.M308756200</pubid><pubid idtype="pmpid" link="fulltext">14551185</pubid></pubidlist></xrefbib></bibl><bibl id="B63"><title><p>Molecular characterization of nucleocytosolic O-GlcNAc transferases of <it>Giardia lamblia </it>and <it>Cryptosporidium parvum</it>.</p></title><aug><au><snm>Banerjee</snm><fnm>S</fnm></au><au><snm>Robbins</snm><fnm>PW</fnm></au><au><snm>Samuelson</snm><fnm>J</fnm></au></aug><source>Glycobiology</source><pubdate>2009</pubdate><volume>19</volume><fpage>331</fpage><lpage>336</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/glycob/cwn107</pubid><pubid idtype="pmcid">2733775</pubid><pubid idtype="pmpid">18948359</pubid></pubidlist></xrefbib></bibl><bibl id="B64"><title><p>A cytoplasmic prolyl hydroxylation and glycosylation pathway modifies Skp1 and regulates O<sub>2</sub>-dependent development in <it>Dictyostelium</it>.</p></title><aug><au><snm>West</snm><fnm>CM</fnm></au><au><snm>Wang</snm><fnm>ZA</fnm></au><au><snm>van der Wel</snm><fnm>H</fnm></au></aug><source>Biochim Biophys Acta</source><pubdate>2010</pubdate><volume>1800</volume><fpage>160</fpage><lpage>171</lpage><xrefbib><pubidlist><pubid idtype="pmcid">2873859</pubid><pubid idtype="pmpid">19914348</pubid></pubidlist></xrefbib></bibl><bibl id="B65"><title><p>Prolyl 4-hydroxylase-1 mediates O2 signaling during development of <it>Dictyostelium</it>.</p></title><aug><au><snm>West</snm><fnm>CM</fnm></au><au><snm>van der Wel</snm><fnm>H</fnm></au><au><snm>Wang</snm><fnm>ZA</fnm></au></aug><source>Development</source><pubdate>2007</pubdate><volume>134</volume><fpage>3349</fpage><lpage>3358</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1242/dev.000893</pubid><pubid idtype="pmpid" link="fulltext">17699611</pubid></pubidlist></xrefbib></bibl><bibl id="B66"><title><p>The evolution of N-glycan-dependent endoplasmic reticulum quality control factors for glycoprotein folding and degradation.</p></title><aug><au><snm>Banerjee</snm><fnm>S</fnm></au><au><snm>Vishwanath</snm><fnm>P</fnm></au><au><snm>Cui</snm><fnm>J</fnm></au><au><snm>Kelleher</snm><fnm>DJ</fnm></au><au><snm>Gilmore</snm><fnm>R</fnm></au><au><snm>Robbins</snm><fnm>PW</fnm></au><au><snm>Samuelson</snm><fnm>J</fnm></au></aug><source>Proc Natl Acad Sci USA</source><pubdate>2007</pubdate><volume>104</volume><fpage>11676</fpage><lpage>11681</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1073/pnas.0704862104</pubid><pubid idtype="pmcid">1905923</pubid><pubid idtype="pmpid">17606910</pubid></pubidlist></xrefbib></bibl><bibl id="B67"><title><p>Discoidin proteins of <it>Dictyostelium </it>are necessary for normal cytoskeletal organization and cellular morphology during aggregation.</p></title><aug><au><snm>Alexander</snm><fnm>S</fnm></au><au><snm>Sydow</snm><fnm>LM</fnm></au><au><snm>Wessels</snm><fnm>D</fnm></au><au><snm>Soll</snm><fnm>DR</fnm></au></aug><source>Differentiation</source><pubdate>1992</pubdate><volume>51</volume><fpage>149</fpage><lpage>161</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1111/j.1432-0436.1992.tb00691.x</pubid><pubid idtype="pmpid">1334012</pubid></pubidlist></xrefbib></bibl><bibl id="B68"><title><p>Loss of the F-actin binding and vesicle-associated protein comitin leads to a phagocytosis defect.</p></title><aug><au><snm>Schreiner</snm><fnm>T</fnm></au><au><snm>Mohrs</snm><fnm>MR</fnm></au><au><snm>Blau-Wasser</snm><fnm>R</fnm></au><au><snm>von Krempelhuber</snm><fnm>A</fnm></au><au><snm>Steinert</snm><fnm>M</fnm></au><au><snm>Schleicher</snm><fnm>M</fnm></au><au><snm>Noegel</snm><fnm>AA</fnm></au></aug><source>Euk Cell</source><pubdate>2003</pubdate><volume>1</volume><fpage>906</fpage><lpage>914</lpage><xrefbib><pubid idtype="doi">10.1128/EC.1.6.906-914.2002</pubid></xrefbib></bibl><bibl id="B69"><title><p>The Ca2+/calcineurin-regulated cup gene family in <it>Dictyostelium discoideum </it>and its possible involvement in development.</p></title><aug><au><snm>Coukell</snm><fnm>B</fnm></au><au><snm>Li</snm><fnm>Y</fnm></au><au><snm>Moniakis</snm><fnm>J</fnm></au><au><snm>Cameron</snm><fnm>A</fnm></au></aug><source>Eukaryot Cell</source><pubdate>2004</pubdate><volume>3</volume><fpage>61</fpage><lpage>71</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1128/EC.3.1.61-71.2004</pubid><pubid idtype="pmcid">329516</pubid><pubid idtype="pmpid">14871937</pubid></pubidlist></xrefbib></bibl><bibl id="B70"><title><p>Structure determination of Discoidin II from <it>Dictyostelium discoideum </it>and carbohydrate binding properties of the lectin domain.</p></title><aug><au><snm>Aragao</snm><fnm>KS</fnm></au><au><snm>Satre</snm><fnm>M</fnm></au><au><snm>Imberty</snm><fnm>A</fnm></au><au><snm>Varrot</snm><fnm>A</fnm></au></aug><source>Proteins</source><pubdate>2008</pubdate><volume>73</volume><fpage>43</fpage><lpage>52</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1002/prot.22038</pubid><pubid idtype="pmpid" link="fulltext">18384150</pubid></pubidlist></xrefbib></bibl><bibl id="B71"><title><p>The role of lineage-specific gene family expansion in the evolution of eukaryotes.</p></title><aug><au><snm>Lespinet</snm><fnm>O</fnm></au><au><snm>Wolf</snm><fnm>YI</fnm></au><au><snm>Koonin</snm><fnm>EV</fnm></au><au><snm>Aravind</snm><fnm>L</fnm></au></aug><source>Genome Res</source><pubdate>2002</pubdate><volume>12</volume><fpage>1048</fpage><lpage>1059</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1101/gr.174302</pubid><pubid idtype="pmcid">186617</pubid><pubid idtype="pmpid">12097341</pubid></pubidlist></xrefbib></bibl><bibl id="B72"><title><p>The xi spore germination-specific cellulase is organized into functional domains.</p></title><aug><au><snm>Ramalingam</snm><fnm>R</fnm></au><au><snm>Blume</snm><fnm>JE</fnm></au><au><snm>Ennis</snm><fnm>HL</fnm></au></aug><source>J Bacteriol</source><pubdate>1992</pubdate><volume>174</volume><fpage>7834</fpage><lpage>7783</lpage><xrefbib><pubidlist><pubid idtype="pmcid">207501</pubid><pubid idtype="pmpid">1447151</pubid></pubidlist></xrefbib></bibl><bibl id="B73"><title><p>Polymorphic members of the lag-gene family mediate kin-discrimination in <it>Dictyostelium</it>.</p></title><aug><au><snm>Benabentos</snm><fnm>R</fnm></au><au><snm>Hirose</snm><fnm>S</fnm></au><au><snm>Sucgang</snm><fnm>R</fnm></au><au><snm>Curk</snm><fnm>T</fnm></au><au><snm>Katoh</snm><fnm>M</fnm></au><au><snm>Ostrowski</snm><fnm>E</fnm></au><au><snm>Strassmann</snm><fnm>JE</fnm></au><au><snm>Queller</snm><fnm>DC</fnm></au><au><snm>Zupan</snm><fnm>DC</fnm></au><au><snm>Shaulsky</snm><fnm>G</fnm></au><au><snm>Kuspa</snm><fnm>A</fnm></au></aug><source>Curr Biol</source><pubdate>2009</pubdate><volume>19</volume><fpage>567</fpage><lpage>572</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1016/j.cub.2009.02.037</pubid><pubid idtype="pmcid">2694408</pubid><pubid idtype="pmpid">19285397</pubid></pubidlist></xrefbib></bibl><bibl id="B74"><title><p>Immune-like phagocyte activity in the social amoeba.</p></title><aug><au><snm>Chen</snm><fnm>G</fnm></au><au><snm>Zhuchenko</snm><fnm>O</fnm></au><au><snm>Kuspa</snm><fnm>A</fnm></au></aug><source>Science</source><pubdate>2007</pubdate><volume>317</volume><fpage>678</fpage><lpage>681</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1126/science.1143991</pubid><pubid idtype="pmpid" link="fulltext">17673666</pubid></pubidlist></xrefbib></bibl><bibl id="B75"><title><p>Fingerprinting of adenylyl cyclase activities during <it>Dictyostelium </it>development indicates a dominant role for adenylyl cyclase B in terminal differentiation.</p></title><aug><au><snm>Meima</snm><fnm>ME</fnm></au><au><snm>Schaap</snm><fnm>P</fnm></au></aug><source>Dev Biol</source><pubdate>1999</pubdate><volume>212</volume><fpage>182</fpage><lpage>190</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1006/dbio.1999.9352</pubid><pubid idtype="pmpid" link="fulltext">10419694</pubid></pubidlist></xrefbib></bibl><bibl id="B76"><title><p>cAMP signaling in <it>Dictyostelium </it>- complexity of cAMP synthesis, degradation and detection.</p></title><aug><au><snm>Saran</snm><fnm>S</fnm></au><au><snm>Meima</snm><fnm>ME</fnm></au><au><snm>Alvarez-Curto</snm><fnm>E</fnm></au><au><snm>Weening</snm><fnm>KE</fnm></au><au><snm>Rozen</snm><fnm>DE</fnm></au><au><snm>Schaap</snm><fnm>P</fnm></au></aug><source>J Muscle Res Cell Motil</source><pubdate>2002</pubdate><volume>23</volume><fpage>793</fpage><lpage>802</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1023/A:1024483829878</pubid><pubid idtype="pmpid" link="fulltext">12952077</pubid></pubidlist></xrefbib></bibl><bibl id="B77"><title><p>Four key signaling pathways mediating chemotaxis in <it>Dictyostelium discoideum</it>.</p></title><aug><au><snm>Veltman</snm><fnm>DM</fnm></au><au><snm>Keizer-Gunnik</snm><fnm>I</fnm></au><au><snm>Van Haastert</snm><fnm>PJ</fnm></au></aug><source>J Cell Biol</source><pubdate>2008</pubdate><volume>180</volume><fpage>747</fpage><lpage>753</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1083/jcb.200709180</pubid><pubid idtype="pmcid">2265585</pubid><pubid idtype="pmpid">18299345</pubid></pubidlist></xrefbib></bibl><bibl id="B78"><title><p>Adenylyl cyclase expression and regulation during the differentiation of <it>Dictyostelium discoideum</it>.</p></title><aug><au><snm>Kriebel</snm><fnm>PW</fnm></au><au><snm>Parent</snm><fnm>CA</fnm></au></aug><source>IUBMB Life</source><pubdate>2004</pubdate><volume>56</volume><fpage>541</fpage><lpage>546</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1080/15216540400013887</pubid><pubid idtype="pmpid" link="fulltext">15590560</pubid></pubidlist></xrefbib></bibl><bibl id="B79"><title><p>Activated cAMP receptors switch encystation into sporulation.</p></title><aug><au><snm>Kawabe</snm><fnm>Y</fnm></au><au><snm>Morio</snm><fnm>T</fnm></au><au><snm>James</snm><fnm>JL</fnm></au><au><snm>Prescott</snm><fnm>AR</fnm></au><au><snm>Tanaka</snm><fnm>Y</fnm></au><au><snm>Schaap</snm><fnm>P</fnm></au></aug><source>Proc Natl Acad Sci USA</source><pubdate>2009</pubdate><volume>106</volume><fpage>7089</fpage><lpage>7094</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1073/pnas.0901617106</pubid><pubid idtype="pmcid">2678454</pubid><pubid idtype="pmpid">19369200</pubid></pubidlist></xrefbib></bibl><bibl id="B80"><title><p>Seven <it>Dictyostelium discoideum </it>phosphodiesterases degrade three pools of cAMP and cGMP.</p></title><aug><au><snm>Bader</snm><fnm>S</fnm></au><au><snm>Kortholt</snm><fnm>A</fnm></au><au><snm>Van Haastert</snm><fnm>PJ</fnm></au></aug><source>Biochem J</source><pubdate>2007</pubdate><volume>402</volume><fpage>153</fpage><lpage>161</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1042/BJ20061153</pubid><pubid idtype="pmcid">1783984</pubid><pubid idtype="pmpid">17040207</pubid></pubidlist></xrefbib></bibl><bibl id="B81"><title><p>RasGEF-containing proteins GbpC and GbpD have differential effects on cell polarity and chemotaxis in <it>Dictyostelium</it>.</p></title><aug><au><snm>Bosgraaf</snm><fnm>L</fnm></au><au><snm>Waijer</snm><fnm>A</fnm></au><au><snm>Engel</snm><fnm>R</fnm></au><au><snm>Visser</snm><fnm>AJ</fnm></au><au><snm>Wessels</snm><fnm>D</fnm></au><au><snm>Soll</snm><fnm>D</fnm></au><au><snm>van Haastert</snm><fnm>PJ</fnm></au></aug><source>J Cell Sci</source><pubdate>2005</pubdate><volume>118</volume><fpage>1899</fpage><lpage>1910</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1242/jcs.02317</pubid><pubid idtype="pmpid" link="fulltext">15827084</pubid></pubidlist></xrefbib></bibl><bibl id="B82"><title><p>Intramolecular activation mechanism of the <it>Dictyostelium </it>LRRK2 homolog Roco protein GbpC.</p></title><aug><au><snm>van Egmond</snm><fnm>WN</fnm></au><au><snm>Kortholt</snm><fnm>A</fnm></au><au><snm>Plak</snm><fnm>K</fnm></au><au><snm>Bosgraaf</snm><fnm>L</fnm></au><au><snm>Bosgraaf</snm><fnm>S</fnm></au><au><snm>Keizer-Gunnink</snm><fnm>I</fnm></au><au><snm>van Haastert</snm><fnm>PJ</fnm></au></aug><source>J Biol Chem</source><pubdate>2008</pubdate><volume>283</volume><fpage>30412</fpage><lpage>30420</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1074/jbc.M804265200</pubid><pubid idtype="pmcid">2662088</pubid><pubid idtype="pmpid">18703517</pubid></pubidlist></xrefbib></bibl><bibl id="B83"><title><p>The biosynthesis of differentiation-inducing factor, a chlorinated signal molecule regulating <it>Dictyostelium </it>development.</p></title><aug><au><snm>Kay</snm><fnm>RR</fnm></au></aug><source>J Biol Chem</source><pubdate>1998</pubdate><volume>273</volume><fpage>2669</fpage><lpage>2675</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1074/jbc.273.5.2669</pubid><pubid idtype="pmpid" link="fulltext">9446571</pubid></pubidlist></xrefbib></bibl><bibl id="B84"><title><p>The role of DIF-1 signaling in <it>Dictyostelium </it>development.</p></title><aug><au><snm>Thompson</snm><fnm>CR</fnm></au><au><snm>Kay</snm><fnm>RR</fnm></au></aug><source>Mol Cell</source><pubdate>2000</pubdate><volume>6</volume><fpage>1509</fpage><lpage>1514</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1016/S1097-2765(00)00147-7</pubid><pubid idtype="pmpid" link="fulltext">11163223</pubid></pubidlist></xrefbib></bibl><bibl id="B85"><title><p>Differentiation-inducing-factor dechlorinase, a novel cytosolic dechlorinating enzyme from <it>Dictyostelium discoideum</it>.</p></title><aug><au><snm>Nayler</snm><fnm>O</fnm></au><au><snm>Insall</snm><fnm>R</fnm></au><au><snm>Kay</snm><fnm>RR</fnm></au></aug><source>Eur J Biochem</source><pubdate>1992</pubdate><volume>208</volume><fpage>531</fpage><lpage>536</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1111/j.1432-1033.1992.tb17217.x</pubid><pubid idtype="pmpid" link="fulltext">1521542</pubid></pubidlist></xrefbib></bibl><bibl id="B86"><title><p>High relatedness maintains multicellular cooperation in a social amoeba by controlling cheater mutants.</p></title><aug><au><snm>Gilbert</snm><fnm>OM</fnm></au><au><snm>Foster</snm><fnm>KR</fnm></au><au><snm>Mehdiabadi</snm><fnm>NJ</fnm></au><au><snm>Strassmann</snm><fnm>JE</fnm></au><au><snm>Queller</snm><fnm>DC</fnm></au></aug><source>Proc Natl Acad Sci USA</source><pubdate>2007</pubdate><volume>104</volume><fpage>8913</fpage><lpage>8917</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1073/pnas.0702723104</pubid><pubid idtype="pmcid">1885602</pubid><pubid idtype="pmpid">17496139</pubid></pubidlist></xrefbib></bibl><bibl id="B87"><title><p>The power of phylogenetic comparison in revealing protein function.</p></title><aug><au><snm>Yang</snm><fnm>Z</fnm></au></aug><source>Proc Natl Acad Sci USA</source><pubdate>2005</pubdate><volume>102</volume><fpage>3179</fpage><lpage>3180</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1073/pnas.0500371102</pubid><pubid idtype="pmcid">552944</pubid><pubid idtype="pmpid">15728394</pubid></pubidlist></xrefbib></bibl><bibl id="B88"><title><p>The prisoner's dilemma and polymorphism in yeast SUC genes.</p></title><aug><au><snm>Greig</snm><fnm>D</fnm></au><au><snm>Travisano</snm><fnm>M</fnm></au></aug><source>Proc Biol Sci</source><pubdate>2004</pubdate><volume>271</volume><issue>Suppl 3</issue><fpage>S25</fpage><lpage>26</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1098/rsbl.2003.0083</pubid><pubid idtype="pmcid">1810003</pubid><pubid idtype="pmpid">15101409</pubid></pubidlist></xrefbib></bibl><bibl id="B89"><title><p>High frequency recombination during the sexual cycle of <it>Dictyostelium discoideum</it>.</p></title><aug><au><snm>Francis</snm><fnm>D</fnm></au></aug><source>Genetics</source><pubdate>1998</pubdate><volume>148</volume><fpage>1829</fpage><lpage>1832</lpage><xrefbib><pubidlist><pubid idtype="pmcid">1460078</pubid><pubid idtype="pmpid">9560397</pubid></pubidlist></xrefbib></bibl><bibl id="B90"><title><p>Genetic exchanges in the macrocysts of <it>Dictyostelium discoideum</it>.</p></title><aug><au><snm>Wallace</snm><fnm>MA</fnm></au><au><snm>Raper</snm><fnm>KB</fnm></au></aug><source>J Gen Microbiol</source><pubdate>1979</pubdate><volume>113</volume><fpage>327</fpage><lpage>337</lpage><xrefbib><pubid idtype="pmpid">292755</pubid></xrefbib></bibl><bibl id="B91"><title><p>Genetic structure of a natural population of <it>Dictyostelium discoideum</it>, a cellular slime mold.</p></title><aug><au><snm>Francis</snm><fnm>D</fnm></au><au><snm>Eisenberg</snm><fnm>R</fnm></au></aug><source>Mol Ecol</source><pubdate>1993</pubdate><volume>2</volume><fpage>385</fpage><lpage>392</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1111/j.1365-294X.1993.tb00031.x</pubid><pubid idtype="pmpid">7909262</pubid></pubidlist></xrefbib></bibl><bibl id="B92"><title><p>Construction of a gamete-enriched gene pool and RNAi-mediated functional analysis in <it>Dictyostelium discoideum</it>.</p></title><aug><au><snm>Muramoto</snm><fnm>T</fnm></au><au><snm>Suzuki</snm><fnm>K</fnm></au><au><snm>Shimizu</snm><fnm>H</fnm></au><au><snm>Kohara</snm><fnm>Y</fnm></au><au><snm>Kohriki</snm><fnm>E</fnm></au><au><snm>Obara</snm><fnm>S</fnm></au><au><snm>Tanaka</snm><fnm>Y</fnm></au><au><snm>Urushihara</snm><fnm>H</fnm></au></aug><source>Mech Dev</source><pubdate>2003</pubdate><volume>120</volume><fpage>965</fpage><lpage>975</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1016/S0925-4773(03)00136-9</pubid><pubid idtype="pmpid" link="fulltext">12963116</pubid></pubidlist></xrefbib></bibl><bibl id="B93"><title><p>An expanded inventory of conserved meiotic genes provides evidence for sex in <it>Trichomonas vaginalis</it>.</p></title><aug><au><snm>Malik</snm><fnm>SB</fnm></au><au><snm>Pightling</snm><fnm>AW</fnm></au><au><snm>Stefaniak</snm><fnm>LM</fnm></au><au><snm>Schurko</snm><fnm>AM</fnm></au><au><snm>Logsdon</snm><fnm>JM</fnm><suf>Jr</suf></au></aug><source>PLoS ONE</source><pubdate>2007</pubdate><volume>3</volume><fpage>e2879</fpage><xrefbib><pubidlist><pubid idtype="doi">10.1371/journal.pone.0002879</pubid><pubid idtype="pmcid">2488364</pubid><pubid idtype="pmpid">18663385</pubid></pubidlist></xrefbib></bibl><bibl id="B94"><title><p>Monograph of the Acrasieae.</p></title><aug><au><snm>Olive</snm><fnm>EW</fnm></au></aug><source>Proc Boston Soc Natur Hist</source><pubdate>1902</pubdate><volume>30</volume><fpage>451</fpage><lpage>513</lpage></bibl><bibl id="B95"><title><p>Cultivation and synchronous morphogenesis of <it>Dictyostelium </it>under controlled experimental conditions.</p></title><aug><au><snm>Sussman</snm><fnm>M</fnm></au></aug><source>Methods Cell Biol</source><pubdate>1987</pubdate><volume>28</volume><fpage>9</fpage><lpage>29</lpage><xrefbib><pubidlist><pubid idtype="doi">full_text</pubid><pubid idtype="pmpid">3298997</pubid></pubidlist></xrefbib></bibl><bibl id="B96"><title><p>Human whole-genome shotgun sequencing.</p></title><aug><au><snm>Weber</snm><fnm>JL</fnm></au><au><snm>Myers</snm><fnm>EW</fnm></au></aug><source>Genome Res</source><pubdate>1997</pubdate><volume>7</volume><fpage>401</fpage><lpage>409</lpage><xrefbib><pubid idtype="pmpid" link="fulltext">9149936</pubid></xrefbib></bibl><bibl id="B97"><title><p>Base-calling of automated sequencer traces using phred. I. Accuracy assessment.</p></title><aug><au><snm>Ewing</snm><fnm>B</fnm></au><au><snm>Hillier</snm><fnm>L</fnm></au><au><snm>Wendl</snm><fnm>MC</fnm></au><au><snm>Green</snm><fnm>P</fnm></au></aug><source>Genome Res</source><pubdate>1998</pubdate><volume>8</volume><fpage>175</fpage><lpage>185</lpage><xrefbib><pubid idtype="pmpid" link="fulltext">9521921</pubid></xrefbib></bibl><bibl id="B98"><title><p>Whole-genome shotgun assembly and analysis of the genome of <it>Fugu rubripes</it>.</p></title><aug><au><snm>Aparicio</snm><fnm>S</fnm></au><au><snm>Chapman</snm><fnm>J</fnm></au><au><snm>Stupka</snm><fnm>E</fnm></au><au><snm>Putnam</snm><fnm>N</fnm></au><au><snm>Chia</snm><fnm>JM</fnm></au><au><snm>Dehal</snm><fnm>P</fnm></au><au><snm>Christoffels</snm><fnm>A</fnm></au><au><snm>Rash</snm><fnm>S</fnm></au><au><snm>Hoon</snm><fnm>S</fnm></au><au><snm>Smit</snm><fnm>A</fnm></au><au><snm>Gelpke</snm><fnm>MD</fnm></au><au><snm>Roach</snm><fnm>J</fnm></au><au><snm>Oh</snm><fnm>T</fnm></au><au><snm>Ho</snm><fnm>IY</fnm></au><au><snm>Wong</snm><fnm>M</fnm></au><au><snm>Detter</snm><fnm>C</fnm></au><au><snm>Verhoef</snm><fnm>F</fnm></au><au><snm>Predki</snm><fnm>P</fnm></au><au><snm>Tay</snm><fnm>A</fnm></au><au><snm>Lucas</snm><fnm>S</fnm></au><au><snm>Richardson</snm><fnm>P</fnm></au><au><snm>Smith</snm><fnm>SF</fnm></au><au><snm>Clark</snm><fnm>MS</fnm></au><au><snm>Edwards</snm><fnm>YJ</fnm></au><au><snm>Doggett</snm><fnm>N</fnm></au><au><snm>Zharkikh</snm><fnm>A</fnm></au><au><snm>Tavtigian</snm><fnm>SV</fnm></au><au><snm>Pruss</snm><fnm>D</fnm></au><au><snm>Barnstead</snm><fnm>M</fnm></au><au><snm>Evans</snm><fnm>C</fnm></au><etal/></aug><source>Science</source><pubdate>2002</pubdate><volume>297</volume><fpage>1301</fpage><lpage>1310</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1126/science.1072104</pubid><pubid idtype="pmpid" link="fulltext">12142439</pubid></pubidlist></xrefbib></bibl><bibl id="B99"><title><p>Pfam.</p></title><url>http://pfam.sanger.ac.uk/</url></bibl><bibl id="B100"><title><p>Ensembl.</p></title><url>http://uswest.ensembl.org/</url></bibl><bibl id="B101"><title><p>The amphioxus genome and the evolution of the chordate karyotype.</p></title><aug><au><snm>Putnam</snm><fnm>NH</fnm></au><au><snm>Butts</snm><fnm>T</fnm></au><au><snm>Ferrier</snm><fnm>DE</fnm></au><au><snm>Furlong</snm><fnm>RF</fnm></au><au><snm>Hellsten</snm><fnm>U</fnm></au><au><snm>Kawashima</snm><fnm>T</fnm></au><au><snm>Robinson-Rechavi</snm><fnm>M</fnm></au><au><snm>Shoguchi</snm><fnm>E</fnm></au><au><snm>Terry</snm><fnm>A</fnm></au><au><snm>Yu</snm><fnm>JK</fnm></au><au><snm>Benito-Guti&#233;rrez</snm><fnm>EL</fnm></au><au><snm>Dubchak</snm><fnm>I</fnm></au><au><snm>Garcia-Fern&#224;ndez</snm><fnm>J</fnm></au><au><snm>Gibson-Brown</snm><fnm>JJ</fnm></au><au><snm>Grigoriev</snm><fnm>IV</fnm></au><au><snm>Horton</snm><fnm>AC</fnm></au><au><snm>de Jong</snm><fnm>PJ</fnm></au><au><snm>Jurka</snm><fnm>J</fnm></au><au><snm>Kapitonov</snm><fnm>VV</fnm></au><au><snm>Kohara</snm><fnm>Y</fnm></au><au><snm>Kuroki</snm><fnm>Y</fnm></au><au><snm>Lindquist</snm><fnm>E</fnm></au><au><snm>Lucas</snm><fnm>S</fnm></au><au><snm>Osoegawa</snm><fnm>K</fnm></au><au><snm>Pennacchio</snm><fnm>LA</fnm></au><au><snm>Salamov</snm><fnm>AA</fnm></au><au><snm>Satou</snm><fnm>Y</fnm></au><au><snm>Sauka-Spengler</snm><fnm>T</fnm></au><au><snm>Schmutz</snm><fnm>J</fnm></au><au><snm>Shin-I</snm><fnm>T</fnm></au><etal/></aug><source>Nature</source><pubdate>2008</pubdate><volume>453</volume><fpage>1064</fpage><lpage>1071</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/nature06967</pubid><pubid idtype="pmpid" link="fulltext">18563158</pubid></pubidlist></xrefbib></bibl><bibl id="B102"><title><p>Neurospora crassa Database.</p></title><url>http://www.broadinstitute.org/annotation/genome/neurospora/MultiHome.html</url></bibl><bibl id="B103"><title><p>TAIR.</p></title><url>http://www.arabidopsis.org/</url></bibl><bibl id="B104"><title><p>The <it>Chlamydomonas </it>genome reveals the evolution of key animal and plant functions.</p></title><aug><au><snm>Merchant</snm><fnm>SS</fnm></au><au><snm>Prochnik</snm><fnm>SE</fnm></au><au><snm>Vallon</snm><fnm>O</fnm></au><au><snm>Harris</snm><fnm>EH</fnm></au><au><snm>Karpowicz</snm><fnm>SJ</fnm></au><au><snm>Witman</snm><fnm>GB</fnm></au><au><snm>Terry</snm><fnm>A</fnm></au><au><snm>Salamov</snm><fnm>A</fnm></au><au><snm>Fritz-Laylin</snm><fnm>LK</fnm></au><au><snm>Mar&#233;chal-Drouard</snm><fnm>L</fnm></au><au><snm>Marshall</snm><fnm>WF</fnm></au><au><snm>Qu</snm><fnm>LH</fnm></au><au><snm>Nelson</snm><fnm>DR</fnm></au><au><snm>Sanderfoot</snm><fnm>AA</fnm></au><au><snm>Spalding</snm><fnm>MH</fnm></au><au><snm>Kapitonov</snm><fnm>VV</fnm></au><au><snm>Ren</snm><fnm>Q</fnm></au><au><snm>Ferris</snm><fnm>P</fnm></au><au><snm>Lindquist</snm><fnm>E</fnm></au><au><snm>Shapiro</snm><fnm>H</fnm></au><au><snm>Lucas</snm><fnm>SM</fnm></au><au><snm>Grimwood</snm><fnm>J</fnm></au><au><snm>Schmutz</snm><fnm>J</fnm></au><au><snm>Cardol</snm><fnm>P</fnm></au><au><snm>Cerutti</snm><fnm>H</fnm></au><au><snm>Chanfreau</snm><fnm>G</fnm></au><au><snm>Chen</snm><fnm>CL</fnm></au><au><snm>Cognat</snm><fnm>V</fnm></au><au><snm>Croft</snm><fnm>MT</fnm></au><au><snm>Dent</snm><fnm>R</fnm></au></aug><source>Science</source><pubdate>2007</pubdate><volume>318</volume><fpage>245</fpage><lpage>250</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1126/science.1143609</pubid><pubid idtype="pmcid">2875087</pubid><pubid idtype="pmpid">17932292</pubid></pubidlist></xrefbib></bibl><bibl id="B105"><title><p>SMART, a simple modular architecture research tool: identification of signaling domains.</p></title><aug><au><snm>Schultz</snm><fnm>J</fnm></au><au><snm>Milpetz</snm><fnm>F</fnm></au><au><snm>Bork</snm><fnm>P</fnm></au><au><snm>Ponting</snm><fnm>CP</fnm></au></aug><source>Proc Natl Acad Sci USA</source><pubdate>1998</pubdate><volume>95</volume><fpage>5857</fpage><lpage>5864</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1073/pnas.95.11.5857</pubid><pubid idtype="pmcid">34487</pubid><pubid idtype="pmpid">9600884</pubid></pubidlist></xrefbib></bibl><bibl id="B106"><title><p>Multiple sequence alignment with the Clustal series of programs.</p></title><aug><au><snm>Chenna</snm><fnm>R</fnm></au><au><snm>Sugawara</snm><fnm>H</fnm></au><au><snm>Koike</snm><fnm>T</fnm></au><au><snm>Lopez</snm><fnm>R</fnm></au><au><snm>Gibson</snm><fnm>TJ</fnm></au><au><snm>Higgins</snm><fnm>DG</fnm></au><au><snm>Thompson</snm><fnm>JD</fnm></au></aug><source>Nucleic Acids Res</source><pubdate>2003</pubdate><volume>31</volume><fpage>3497</fpage><lpage>3500</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/nar/gkg500</pubid><pubid idtype="pmcid">168907</pubid><pubid idtype="pmpid">12824352</pubid></pubidlist></xrefbib></bibl><bibl id="B107"><title><p>Bioedit: a user-friendly biological sequence alignment editor and analysis program fro Windows 95/98/NT.</p></title><aug><au><snm>Hall</snm><fnm>TA</fnm></au></aug><source>Nucleic Acids Symp Ser</source><pubdate>1999</pubdate><volume>41</volume><fpage>95</fpage><lpage>98</lpage></bibl><bibl id="B108"><title><p>MrBayes 3: Bayesian phylogenetic inference under mixed models.</p></title><aug><au><snm>Ronquist</snm><fnm>F</fnm></au><au><snm>Huelsenbeck</snm><fnm>JP</fnm></au></aug><source>Bioinformatics</source><pubdate>2003</pubdate><volume>19</volume><fpage>1572</fpage><lpage>1574</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/bioinformatics/btg180</pubid><pubid idtype="pmpid" link="fulltext">12912839</pubid></pubidlist></xrefbib></bibl><bibl id="B109"><title><p>Comparative analysis of amino acid repeats in rodents and humans.</p></title><aug><au><snm>Alba</snm><fnm>MM</fnm></au><au><snm>Guigo</snm><fnm>R</fnm></au></aug><source>Genome Res</source><pubdate>2004</pubdate><volume>14</volume><fpage>549</fpage><lpage>554</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1101/gr.1925704</pubid><pubid idtype="pmcid">383298</pubid><pubid idtype="pmpid">15059995</pubid></pubidlist></xrefbib></bibl><bibl id="B110"><title><p>tRNAscan-SE: a program for improved detection of transfer RNA genes in genomic sequence.</p></title><aug><au><snm>Lowe</snm><fnm>TM</fnm></au><au><snm>Eddy</snm><fnm>SR</fnm></au></aug><source>Nucleic Acids Res</source><pubdate>1997</pubdate><volume>25</volume><fpage>955</fpage><lpage>964</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/nar/25.5.955</pubid><pubid idtype="pmcid">146525</pubid><pubid idtype="pmpid">9023104</pubid></pubidlist></xrefbib></bibl><bibl id="B111"><title><p>The small RNA repertoire of <it>Dictyostelium discoideum </it>and its regulation by components of the RNAi pathway.</p></title><aug><au><snm>Hinas</snm><fnm>A</fnm></au><au><snm>Reimegard</snm><fnm>J</fnm></au><au><snm>Wagner</snm><fnm>EG</fnm></au><au><snm>Nellen</snm><fnm>W</fnm></au><au><snm>Ambros</snm><fnm>VR</fnm></au><au><snm>Soderbom</snm><fnm>F</fnm></au></aug><source>Nucleic Acids Res</source><pubdate>2007</pubdate><volume>35</volume><fpage>6714</fpage><lpage>6726</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/nar/gkm707</pubid><pubid idtype="pmcid">2175303</pubid><pubid idtype="pmpid">17916577</pubid></pubidlist></xrefbib></bibl><bibl id="B112"><title><p>Protein coding regions of the D. purpureum genome.</p></title><url>ftp://ftp.jgi-psf.org/pub/JGI_data/Dictyostelium_purpureum/v1.0/annotation/Dicpu1_best_genes.gff.gz</url></bibl><bibl id="B113"><title><p>Protein coding regions of the D. disdoideum genome.</p></title><url>http://dictybase.org/download/gff3/dicty_gff3_10212009.zip</url></bibl><bibl id="B114"><title><p>LocARNA.</p></title><url>http://rna.tbi.univie.ac.at/cgi-bin/LocARNA.cgi</url></bibl><bibl id="B115"><title><p>RNALogo: CreateLogo.</p></title><url>http://rnalogo.mbc.nctu.edu.tw/createlogo.html</url></bibl><bibl id="B116"><title><p>Automatic clustering of orthologs and in-paralogs from pairwise species comparisons.</p></title><aug><au><snm>Remm</snm><fnm>M</fnm></au><au><snm>Storm</snm><fnm>CE</fnm></au><au><snm>Sonnhammer</snm><fnm>EL</fnm></au></aug><source>J Mol Biol</source><pubdate>2001</pubdate><volume>314</volume><fpage>1041</fpage><lpage>1052</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1006/jmbi.2000.5197</pubid><pubid idtype="pmpid" link="fulltext">11743721</pubid></pubidlist></xrefbib></bibl><bibl id="B117"><title><p>The Pfam protein families database.</p></title><aug><au><snm>Finn</snm><fnm>RD</fnm></au><au><snm>Tate</snm><fnm>J</fnm></au><au><snm>Mistry</snm><fnm>J</fnm></au><au><snm>Coggill</snm><fnm>PC</fnm></au><au><snm>Sammut</snm><fnm>SJ</fnm></au><au><snm>Hotz</snm><fnm>HR</fnm></au><au><snm>Ceric</snm><fnm>G</fnm></au><au><snm>Forslund</snm><fnm>K</fnm></au><au><snm>Eddy</snm><fnm>SR</fnm></au><au><snm>Sonnhammer</snm><fnm>EL</fnm></au><au><snm>Bateman</snm><fnm>A</fnm></au></aug><source>Nucleic Acids Res</source><pubdate>2008</pubdate><issue>36 Database</issue><fpage>D281</fpage><lpage>288</lpage><xrefbib><pubidlist><pubid idtype="pmcid">2238907</pubid><pubid idtype="pmpid">18039703</pubid></pubidlist></xrefbib></bibl><bibl id="B118"><title><p>MUSCLE: multiple sequence alignment with high accuracy and high throughput.</p></title><aug><au><snm>Edgar</snm><fnm>RC</fnm></au></aug><source>Nucleic Acids Res</source><pubdate>2004</pubdate><volume>32</volume><fpage>1792</fpage><lpage>1797</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/nar/gkh340</pubid><pubid idtype="pmcid">390337</pubid><pubid idtype="pmpid">15034147</pubid></pubidlist></xrefbib></bibl><bibl id="B119"><title><p>MEGA4: Molecular Evolutionary Genetics Analysis (MEGA) software version 4.0.</p></title><aug><au><snm>Tamura</snm><fnm>K</fnm></au><au><snm>Dudley</snm><fnm>J</fnm></au><au><snm>Nei</snm><fnm>M</fnm></au><au><snm>Kumar</snm><fnm>S</fnm></au></aug><source>Mol Biol Evol</source><pubdate>2007</pubdate><volume>24</volume><fpage>1596</fpage><lpage>1599</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/molbev/msm092</pubid><pubid idtype="pmpid" link="fulltext">17488738</pubid></pubidlist></xrefbib></bibl><bibl id="B120"><title><p>Polyketide synthase gene analyses.</p></title><url>http://www.mrc-lmb.cam.ac.uk/genomes/madanm/rrk</url></bibl><bibl id="B121"><title><p>Molecular tinkering of G protein-coupled receptors: an evolutionary success.</p></title><aug><au><snm>Bockaert</snm><fnm>J</fnm></au><au><snm>Pin</snm><fnm>JP</fnm></au></aug><source>EMBO J</source><pubdate>1999</pubdate><volume>18</volume><fpage>1723</fpage><lpage>1729</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/emboj/18.7.1723</pubid><pubid idtype="pmcid">1171258</pubid><pubid idtype="pmpid">10202136</pubid></pubidlist></xrefbib></bibl><bibl id="B122"><title><p>The <it>Dictyostelium </it>repertoire of seven transmembrane domain receptors.</p></title><aug><au><snm>Prabhu</snm><fnm>Y</fnm></au><au><snm>Eichinger</snm><fnm>L</fnm></au></aug><source>Eur J Cell Biol</source><pubdate>2006</pubdate><volume>85</volume><fpage>937</fpage><lpage>946</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1016/j.ejcb.2006.04.003</pubid><pubid idtype="pmpid" link="fulltext">16735079</pubid></pubidlist></xrefbib></bibl><bibl id="B123"><title><p>Two novel GPCR-type G proteins are abscisic acid receptors in <it>Arabidopsis</it>.</p></title><aug><au><snm>Pandey</snm><fnm>S</fnm></au><au><snm>Nelson</snm><fnm>DC</fnm></au><au><snm>Assmann</snm><fnm>SM</fnm></au></aug><source>Cell</source><pubdate>2009</pubdate><volume>136</volume><fpage>136</fpage><lpage>148</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1016/j.cell.2008.12.026</pubid><pubid idtype="pmpid" link="fulltext">19135895</pubid></pubidlist></xrefbib></bibl><bibl id="B124"><title><p>Evolution of key cell signaling and adhesion protein families predates animal origins.</p></title><aug><au><snm>King</snm><fnm>N</fnm></au><au><snm>Hittinger</snm><fnm>CT</fnm></au><au><snm>Carroll</snm><fnm>SB</fnm></au></aug><source>Science</source><pubdate>2003</pubdate><volume>301</volume><fpage>361</fpage><lpage>363</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1126/science.1083853</pubid><pubid idtype="pmpid" link="fulltext">12869759</pubid></pubidlist></xrefbib></bibl><bibl id="B125"><title><p>The actinome of <it>Dictyostelium discoideum </it>in comparison to actins and actin-related proteins from other organisms.</p></title><aug><au><snm>Joseph</snm><fnm>JM</fnm></au><au><snm>Fey</snm><fnm>P</fnm></au><au><snm>Ramalingam</snm><fnm>N</fnm></au><au><snm>Liu</snm><fnm>XI</fnm></au><au><snm>Rohlfs</snm><fnm>M</fnm></au><au><snm>Noegel</snm><fnm>AA</fnm></au><au><snm>Muller-Taubenberger</snm><fnm>A</fnm></au><au><snm>Glockner</snm><fnm>G</fnm></au><au><snm>Schleicher</snm><fnm>M</fnm></au></aug><source>PLoS ONE</source><pubdate>2008</pubdate><volume>3</volume><fpage>e2654</fpage><xrefbib><pubidlist><pubid idtype="doi">10.1371/journal.pone.0002654</pubid><pubid idtype="pmcid">2441452</pubid><pubid idtype="pmpid">18612387</pubid></pubidlist></xrefbib></bibl><bibl id="B126"><title><p>Glycogen synthesis in the absence of glycogenin in the yeast <it>Saccharomyces cerevisiae</it>.</p></title><aug><au><snm>Torija</snm><fnm>MJ</fnm></au><au><snm>Novo</snm><fnm>M</fnm></au><au><snm>Lemassu</snm><fnm>A</fnm></au><au><snm>Wilson</snm><fnm>W</fnm></au><au><snm>Roach</snm><fnm>PJ</fnm></au><au><snm>Fran&#231;ois</snm><fnm>J</fnm></au><au><snm>Parrou</snm><fnm>JL</fnm></au></aug><source>FEBS Lett</source><pubdate>2005</pubdate><volume>579</volume><fpage>3999</fpage><lpage>4004</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1016/j.febslet.2005.06.007</pubid><pubid idtype="pmpid" link="fulltext">16004992</pubid></pubidlist></xrefbib></bibl><bibl id="B127"><title><p>Metabolic symbiosis and the birth of the plant kingdom.</p></title><aug><au><snm>Deschamps</snm><fnm>P</fnm></au><au><snm>Colleoni</snm><fnm>C</fnm></au><au><snm>Nakamura</snm><fnm>Y</fnm></au><au><snm>Suzuki</snm><fnm>E</fnm></au><au><snm>Putaux</snm><fnm>JL</fnm></au><au><snm>Bul&#233;on</snm><fnm>A</fnm></au><au><snm>Haebel</snm><fnm>S</fnm></au><au><snm>Ritte</snm><fnm>G</fnm></au><au><snm>Steup</snm><fnm>M</fnm></au><au><snm>Falc&#243;n</snm><fnm>LI</fnm></au><au><snm>Moreira</snm><fnm>D</fnm></au><au><snm>L&#246;ffelhardt</snm><fnm>W</fnm></au><au><snm>Raj</snm><fnm>JN</fnm></au><au><snm>Plancke</snm><fnm>C</fnm></au><au><snm>d&apos;Hulst</snm><fnm>C</fnm></au><au><snm>Dauvill&#233;e</snm><fnm>D</fnm></au><au><snm>Ball</snm><fnm>S</fnm></au></aug><source>Mol Biol Evol</source><pubdate>2008</pubdate><volume>25</volume><fpage>536</fpage><lpage>548</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/molbev/msm280</pubid><pubid idtype="pmpid" link="fulltext">18093994</pubid></pubidlist></xrefbib></bibl><bibl id="B128"><title><p>New insights on trehalose: a multifunctional molecule.</p></title><aug><au><snm>Elbein</snm><fnm>AD</fnm></au><au><snm>Pan</snm><fnm>YT</fnm></au><au><snm>Pastuszak</snm><fnm>I</fnm></au><au><snm>Carroll</snm><fnm>D</fnm></au></aug><source>Glycobiology</source><pubdate>2003</pubdate><volume>13</volume><fpage>17R</fpage><lpage>27R</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/glycob/cwg047</pubid><pubid idtype="pmpid" link="fulltext">12626396</pubid></pubidlist></xrefbib></bibl><bibl id="B129"><title><p>The cellulose synthase gene of <it>Dictyostelium</it>.</p></title><aug><au><snm>Blanton</snm><fnm>RL</fnm></au><au><snm>Fuller</snm><fnm>D</fnm></au><au><snm>Iranfar</snm><fnm>N</fnm></au><au><snm>Grimson</snm><fnm>MJ</fnm></au><au><snm>Loomis</snm><fnm>WF</fnm></au></aug><source>Proc Natl Acad Sci USA</source><pubdate>2000</pubdate><volume>97</volume><fpage>2391</fpage><lpage>2396</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1073/pnas.040565697</pubid><pubid idtype="pmcid">15811</pubid><pubid idtype="pmpid">10681463</pubid></pubidlist></xrefbib></bibl><bibl id="B130"><title><p>Cellulose-binding modules from extracellular matrix proteins of <it>Dictyostelium discoideum </it>stalk and sheath.</p></title><aug><au><snm>Wang</snm><fnm>YZ</fnm></au><au><snm>Slade</snm><fnm>MB</fnm></au><au><snm>Gooley</snm><fnm>AA</fnm></au><au><snm>Atwell</snm><fnm>BJ</fnm></au><au><snm>Williams</snm><fnm>KL</fnm></au></aug><source>Eur J Biochem</source><pubdate>2001</pubdate><volume>268</volume><fpage>4334</fpage><lpage>4345</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1046/j.1432-1327.2001.02354.x</pubid><pubid idtype="pmpid" link="fulltext">11488929</pubid></pubidlist></xrefbib></bibl><bibl id="B131"><title><p>Dependence of stress resistance on a spore coat heteropolysaccharide in <it>Dictyostelium</it>.</p></title><aug><au><snm>West</snm><fnm>CM</fnm></au><au><snm>Nguyen</snm><fnm>P</fnm></au><au><snm>van der Wel</snm><fnm>H</fnm></au><au><snm>Metcalf</snm><fnm>T</fnm></au><au><snm>Sweeney</snm><fnm>KR</fnm></au><au><snm>Blader</snm><fnm>IJ</fnm></au><au><snm>Erdos</snm><fnm>GW</fnm></au></aug><source>Eukaryot Cell</source><pubdate>2009</pubdate><volume>8</volume><fpage>27</fpage><lpage>36</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1128/EC.00398-07</pubid><pubid idtype="pmcid">2620749</pubid><pubid idtype="pmpid">18996984</pubid></pubidlist></xrefbib></bibl><bibl id="B132"><title><p>Comparative analysis of spore coat formation, structure, and function in <it>Dictyostelium</it>.</p></title><aug><au><snm>West</snm><fnm>CM</fnm></au></aug><source>Int Rev Cytol</source><pubdate>2003</pubdate><volume>222</volume><fpage>237</fpage><lpage>293</lpage><xrefbib><pubidlist><pubid idtype="doi">full_text</pubid><pubid idtype="pmpid">12503851</pubid></pubidlist></xrefbib></bibl><bibl id="B133"><title><p>The compositional adjustment of amino acid substitution matrices.</p></title><aug><au><snm>Yu</snm><fnm>YK</fnm></au><au><snm>Wootton</snm><fnm>JC</fnm></au><au><snm>Altschul</snm><fnm>SF</fnm></au></aug><source>Proc Natl Acad Sci USA</source><pubdate>2003</pubdate><volume>100</volume><fpage>15688</fpage><lpage>15693</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1073/pnas.2533904100</pubid><pubid idtype="pmcid">307629</pubid><pubid idtype="pmpid">14663142</pubid></pubidlist></xrefbib></bibl><bibl id="B134"><title><p>Dynamic use of multiple parameter sets in sequence alignment.</p></title><aug><au><snm>Huang</snm><fnm>X</fnm></au><au><snm>Brutlag</snm><fnm>DL</fnm></au></aug><source>Nucleic Acids Res</source><pubdate>2007</pubdate><volume>35</volume><fpage>678</fpage><lpage>686</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/nar/gkl1063</pubid><pubid idtype="pmcid">1802605</pubid><pubid idtype="pmpid">17182633</pubid></pubidlist></xrefbib></bibl><bibl id="B135"><title><p>PAML 4: phylogenetic analysis by maximum likelihood.</p></title><aug><au><snm>Yang</snm><fnm>Z</fnm></au></aug><source>Mol Biol Evol</source><pubdate>2007</pubdate><volume>24</volume><fpage>1586</fpage><lpage>1591</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/molbev/msm088</pubid><pubid idtype="pmpid" link="fulltext">17483113</pubid></pubidlist></xrefbib></bibl><bibl id="B136"><title><p>Genome-wide identification of genes likely to be involved in human genetic disease.</p></title><aug><au><snm>Lopez-Bigas</snm><fnm>N</fnm></au><au><snm>Ouzounis</snm><fnm>CA</fnm></au></aug><source>Nucleic Acids Res</source><pubdate>2004</pubdate><volume>32</volume><fpage>3108</fpage><lpage>3114</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/nar/gkh605</pubid><pubid idtype="pmcid">434425</pubid><pubid idtype="pmpid">15181176</pubid></pubidlist></xrefbib></bibl></refgrp>
</bm></art>