<?xml version='1.0'?>
<!DOCTYPE art SYSTEM 'http://www.biomedcentral.com/xml/article.dtd'>
<art>
   <ui>gb-2004-5-9-r72</ui>
   <ji>GBJ</ji>
   <fm>
      <dochead>Method</dochead>
      <bibl>
         <title>
            <p>Large-scale exploration of growth inhibition caused by overexpression of genomic fragments in <it>Saccharomyces cerevisiae</it></p>
         </title>
         <aug>
            <au id="A1" ca="yes">
               <snm>Boyer</snm>
               <fnm>Jeanne</fnm>
               <insr iid="I1"/>
               <email>jboyer@pasteur.fr</email>
            </au>
            <au id="A2">
               <snm>Badis</snm>
               <fnm>Gwena&#235;l</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <email>gbreard@pasteur.fr</email>
            </au>
            <au id="A3">
               <snm>Fairhead</snm>
               <fnm>C&#233;cile</fnm>
               <insr iid="I1"/>
               <email>cfair@pasteur.fr</email>
            </au>
            <au id="A4">
               <snm>Talla</snm>
               <fnm>Emmanuel</fnm>
               <insr iid="I1"/>
               <insr iid="I3"/>
               <email>etalla@pasteur.fr</email>
            </au>
            <au id="A5">
               <snm>Hantraye</snm>
               <fnm>Florence</fnm>
               <insr iid="I2"/>
               <email>fricard@pasteur.fr</email>
            </au>
            <au id="A6">
               <snm>Fabre</snm>
               <fnm>Emmanuelle</fnm>
               <insr iid="I1"/>
               <email>efabre@pasteur.fr</email>
            </au>
            <au id="A7">
               <snm>Fischer</snm>
               <fnm>Gilles</fnm>
               <insr iid="I1"/>
               <email>fischer@pasteur.fr</email>
            </au>
            <au id="A8">
               <snm>Hennequin</snm>
               <fnm>Christophe</fnm>
               <insr iid="I1"/>
               <insr iid="I4"/>
               <email>chenneq@pasteur.fr</email>
            </au>
            <au id="A9">
               <snm>Koszul</snm>
               <fnm>Romain</fnm>
               <insr iid="I1"/>
               <email>koszul@pasteur.fr</email>
            </au>
            <au id="A10">
               <snm>Lafontaine</snm>
               <fnm>Ingrid</fnm>
               <insr iid="I1"/>
               <email>ingridl@pasteur.fr</email>
            </au>
            <au id="A11">
               <snm>Ozier-Kalogeropoulos</snm>
               <fnm>Odile</fnm>
               <insr iid="I1"/>
               <email>odozier@pasteur.fr</email>
            </au>
            <au id="A12">
               <snm>Ricchetti</snm>
               <fnm>Miria</fnm>
               <insr iid="I1"/>
               <insr iid="I5"/>
               <email>mricch@pasteur.fr</email>
            </au>
            <au id="A13">
               <snm>Richard</snm>
               <fnm>Guy-Franck</fnm>
               <insr iid="I1"/>
               <email>gfrichar@pasteur.fr</email>
            </au>
            <au id="A14">
               <snm>Thierry</snm>
               <fnm>Agn&#232;s</fnm>
               <insr iid="I1"/>
               <email>athierry@pasteur.fr</email>
            </au>
            <au id="A15">
               <snm>Dujon</snm>
               <fnm>Bernard</fnm>
               <insr iid="I1"/>
               <email>bdujon@pasteur.fr</email>
            </au>
         </aug>
         <insg>
            <ins id="I1">
               <p>Unit&#233; de G&#233;n&#233;tique Mol&#233;culaire des Levures (URA2171 CNRS and UFR 927 Universit&#233; Pierre et Marie Curie)</p>
            </ins>
            <ins id="I2">
               <p>Unit&#233; de G&#233;n&#233;tique des Interactions Macromol&#233;culaires (URA2171 CNRS), Department of Structure and Dynamics of Genomes, Institut Pasteur, 25 rue du Dr Roux, 75724 Paris-Cedex 15, France</p>
            </ins>
            <ins id="I3">
               <p>CNRS-Laboratoire de Chimie Bact&#233;rienne, 31 Chemin Joseph Aiguier, 13402 Marseille-Cedex 20, France</p>
            </ins>
            <ins id="I4">
               <p>Laboratoire de Parasitologie, Facult&#233; de M&#233;decine St-Antoine, 27 rue de Chaligny, 75012 Paris, France</p>
            </ins>
            <ins id="I5">
               <p>Unit&#233; de G&#233;n&#233;tique et Biochimie du D&#233;veloppement, Institut Pasteur, 25 rue du Dr Roux 75724 Paris-Cedex 15, France</p>
            </ins>
         </insg>
         <source>Genome Biology</source>
         <issn>1465-6906</issn>
         <pubdate>2004</pubdate>
         <volume>5</volume>
         <issue>9</issue>
         <fpage>R72</fpage>
         <url>http://genomebiology.com/2004/5/9/R72</url>
         <xrefbib>
            <pubidlist>
               <pubid idtype="pmpid">15345056</pubid>
               <pubid idtype="doi">10.1186/gb-2004-5-9-r72</pubid>
            </pubidlist>
         </xrefbib>
      </bibl>
      <history>
         <rec>
            <date>
               <day>24</day>
               <month>5</month>
               <year>2004</year>
            </date>
         </rec>
         <revrec>
            <date>
               <day>13</day>
               <month>7</month>
               <year>2004</year>
            </date>
         </revrec>
         <acc>
            <date>
               <day>26</day>
               <month>7</month>
               <year>2004</year>
            </date>
         </acc>
         <pub>
            <date>
               <day>31</day>
               <month>8</month>
               <year>2004</year>
            </date>
         </pub>
      </history>
      <cpyrt>
         <year>2004</year>
         <collab>Boyer et al.; licensee BioMed Central Ltd.</collab>
         <note>This is an Open Access article distributed under the terms of the Creative Commons Attribution License (<url>http://creativecommons.org/licenses/by/2.0</url>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited. </note>
      </cpyrt>
      <shorttitle>
         <p>Large-scale exploration of growth inhibition caused by overexpression of genomic fragments in <it>Saccharomyces cerevisiae</it></p>
      </shorttitle>
      <shortabs>
         <p>A screen of the <it>Saccharomyces cerevisiae</it> genome for fragments conferring a growth-impairment phenotype identified 714 fragments in about 84,000 clones tested.</p>
      </shortabs>
      <abs>
         <sec>
            <st>
               <p>Abstract</p>
            </st>
            <p>We have screened the genome of <it>Saccharomyces cerevisiae </it>for fragments that confer a growth-retardation phenotype when overexpressed in a multicopy plasmid with a tetracycline-regulatable (Tet-off) promoter. We selected 714 such fragments with a mean size of 700 base-pairs out of around 84,000 clones tested. These include 493 in-frame open reading frame fragments corresponding to 454 distinct genes (of which 91 are of unknown function), and 162 out-of-frame, antisense and intergenic genomic fragments, representing the largest collection of toxic inserts published so far in yeast.</p>
         </sec>
      </abs>
   </fm>
   <meta>
      <classifications>
         <classification type="BMC" subtype="man_spc_id" id="30010009">Genetics</classification>
         <classification type="BMC" subtype="man_spc_id" id="30010013">Methods</classification>
         <classification type="BMC" subtype="man_spc_id" id="30010014">Microbiology and parasitology</classification>
         <classification type="BMC" subtype="man_spc_id" id="30010015">Model organisms</classification>
      </classifications>
   </meta>
   <bdy>
      <sec>
         <st>
            <p>Background</p>
         </st>
         <p>The complete genome sequences of various eukaryotic model organisms such as <it>Saccharomyces cerevisiae</it>, <it>Caenorhabditis elegans</it>, <it>Drosophila melanogaster</it>, <it>Arabidopsis thaliana </it>and <it>Schizosaccharomyces pombe</it>, have revealed a large number of novel genes of unknown functions. In <it>S. cerevisiae</it>, for example, around 1,800 genes (of the total of around 5,800) encode proteins that so far remain functionally uncharacterized (compilation from <it>Saccharomyces </it>Genome Database (SGD) <abbrgrp><abbr bid="B1">1</abbr></abbrgrp> April 2004). Since the completion of its DNA sequence <abbrgrp><abbr bid="B2">2</abbr></abbrgrp>, the genome of <it>S. cerevisiae </it>has been extensively studied, serving as a test case for novel and important developments in functional genomics. Such developments include transposon-mediated gene inactivation and tagging <abbrgrp><abbr bid="B3">3</abbr></abbrgrp>, the analysis of gene-expression networks through partial or complete transcriptome studies <abbrgrp><abbr bid="B4">4</abbr><abbr bid="B5">5</abbr><abbr bid="B6">6</abbr></abbrgrp>, two-hybrid screening <abbrgrp><abbr bid="B7">7</abbr><abbr bid="B8">8</abbr><abbr bid="B9">9</abbr></abbrgrp>, protein-complex purification <abbrgrp><abbr bid="B10">10</abbr><abbr bid="B11">11</abbr></abbrgrp>, two-dimensional gel protein identification <abbrgrp><abbr bid="B12">12</abbr></abbrgrp>, proteome qualitative analysis by protein microarrays (see review in <abbrgrp><abbr bid="B13">13</abbr></abbrgrp>) and protein abundance measurements after <it>in situ </it>gene tagging <abbrgrp><abbr bid="B14">14</abbr></abbrgrp>. Even intergenic regions have been studied using microarray technology to characterize transcription-factor-binding sites and to map replication origins or recombination hotspots <abbrgrp><abbr bid="B15">15</abbr><abbr bid="B16">16</abbr></abbrgrp> (see also <abbrgrp><abbr bid="B17">17</abbr></abbrgrp> for a review). 
Following a large cooperative effort between European and American labs, a nearly complete collection of deletion mutants of all yeast protein-coding genes is now available <abbrgrp><abbr bid="B18">18</abbr><abbr bid="B19">19</abbr><abbr bid="B20">20</abbr></abbrgrp>, which offers the possibility of systematically screening numerous phenotypes, including synthetic lethals <abbrgrp><abbr bid="B21">21</abbr><abbr bid="B22">22</abbr><abbr bid="B23">23</abbr></abbrgrp>, in search of novel gene functions.</p>
         <p>As a complement to gene inactivation, phenotypic changes resulting from gene overexpression may also be informative of gene functions. Indeed, in a number of cases, such as genes encoding cytoskeletal proteins or protein kinases and phosphatases, overexpression may lead to a lethal phenotype (see <abbrgrp><abbr bid="B24">24</abbr></abbrgrp> for a review). The overexpression approach is complementary to the loss-of-function approach, as it leads to dominant phenotypes even in the presence of the wild-type gene, thus allowing the study of genes for which no loss-of-function mutants can be obtained. Overexpression of gene fragments can be equivalent to 'dominant negative mutation' in which the fragment disrupts the activity of the wild-type gene <abbrgrp><abbr bid="B25">25</abbr></abbrgrp>. Overexpression can also activate specific pathways, leading to deleterious phenotypes: examples include genes involved in the yeast pheromone response pathway, such as <it>STE4</it>, <it>STE11 </it>and <it>STE12 </it>(see <abbrgrp><abbr bid="B24">24</abbr><abbr bid="B26">26</abbr></abbrgrp> and references therein). In other cases, specific effects are not known, but the region responsible for toxicity has been identified. For example, lethality upon overexpression of Rap1p depends on the presence of the DNA-binding domain and an adjacent region <abbrgrp><abbr bid="B27">27</abbr></abbrgrp>. In general, however, unless the domain structure of the protein is well understood, one cannot predict which segment(s) of it would act as a dominant mutant when overexpressed.</p>
         <p>Several yeast cDNA libraries have been screened for lethal or impaired growth phenotypes upon overexpression under the control of the <it>GAL1 </it>or <it>GAL10 </it>promoters on centromeric or multicopy plasmids <abbrgrp><abbr bid="B28">28</abbr><abbr bid="B29">29</abbr><abbr bid="B30">30</abbr></abbrgrp>. Other libraries of random genomic DNA have also been screened for toxicity upon overexpression from the same promoters <abbrgrp><abbr bid="B24">24</abbr><abbr bid="B26">26</abbr></abbrgrp>. Whereas the four earlier studies each identified only a few genes (from 1 to 24 each, making a grand total of 43), Stevenson <it>et al. </it><abbrgrp><abbr bid="B30">30</abbr></abbrgrp> identified 185 genes (20 of which were shared with earlier work) that cause impaired growth when overexpressed.</p>
         <p>In the work reported here, we have screened the yeast genome with the aim of characterizing a list of fragments whose overexpression confers growth impairment. To do this, we constructed a yeast genomic library in a multicopy plasmid vector in which transcription is driven by a chimeric tetO-<it>CYC1 </it>promoter <abbrgrp><abbr bid="B31">31</abbr></abbrgrp>. Random genomic inserts of a mean size of 700 base-pairs (bp) were overexpressed in yeast as translational fusions using the plasmid-borne initiation codon. Out of around 84,000 clones tested, we have identified the largest collection yet of toxic overexpressed fragments in yeast: 714 showed overexpression-dependent lethality or various degrees of growth impairment, identifying 454 protein-coding genes (91 of which are of unknown function), and a variety of intergenic or other regions.</p>
      </sec>
      <sec>
         <st>
            <p>Results</p>
         </st>
         <sec>
            <st>
               <p>Screening the library of yeast random genomic fragments for toxic phenotypes</p>
            </st>
            <p>We have analyzed a total of 84,086 independent yeast transformants, each of which contains a random fragment of the yeast genome placed under the control of a doxycycline-repressible promoter (Figure <figr fid="F1">1a,1b</figr>). Effects on growth or survival were monitored by spotting serial dilutions of the transformants in the presence and absence of doxycycline (uninduced and overexpression conditions, respectively; Figure <figr fid="F1">1c</figr>). Phenotypes were recorded using numerical values from 0 to 3 (Figure <figr fid="F2">2</figr>): value 3 was assigned to normal growth (similar to the non-toxic control), 2 and 1 were assigned to intermediate growth levels (less abundant and/or smaller-sized colonies), and 0 was assigned to complete or almost complete absence of colonies (comparable to the toxic control on the same plate). We have retained 714 clones (0.85% of total) that show impaired growth in overexpression conditions (Table <tblr tid="T1">1</tblr>). Among these, 112 also show a slight or severe growth reduction (level 2 for 77 cases, or level 1 for 35 cases, respectively) in uninduced conditions. Proof that the observed growth defects were caused by the presence of the plasmid rather than an accidental mutation in the clone was directly demonstrated by the recovery of the wild-type phenotype after plasmid loss using selection for resistance to 5-fluoroorotic acid (5-FOA) (Figure <figr fid="F2">2</figr>).</p>
            <fig id="F1">
               <title>
                  <p>Figure 1</p>
               </title>
               <caption>
                  <p>Overexpression library construction and screening</p>
               </caption>
               <text>
                  <p>Overexpression library construction and screening. <b>(a) </b>Construction of an HA-tagged vector. The pCMha190 vector used here was constructed by insertion of a linker (gray box) in place of the multiple cloning site in vector pCM190 [31]. Features shown include the promoter and TATA box as well as the terminator from the original plasmid (open boxes), and the start codon, HA-tag, <it>Bam</it>HI site and stop codons (thick vertical bars) from the introduced linker sequence. The linker was composed from the following annealed oligonucleotides: EXP3: 5'-GATCGTTTAAACCATATGTACCCATACGACGTCCCAGACTACGCTGGATCCTGACTGACTGATC-3', EXP4: 5'-GGCCGATCAGTCAGTCAGGATCCAGCGTAGTCTGGGACGTCGTATGGGTACATATGGTTTAAAC-3'. <b>(b) </b>Library construction in pCMha190 (see Materials and methods for experimental details). The resulting ligation product is schematized, with the insert as a striped box and adaptors as hatched boxes. Sequences shown below are from junctions, with uppercase letters corresponding to vector (the extra nucleotide from filling-in is underlined), lowercase letters to adaptors and bold nnn's to insert. Arrows indicate the different primers used: SEQ8 and SEQ4 are used for PCR amplification of the insert, and SEQ1 for sequencing (see sequences in Additional data file 8). <b>(c) </b>First-round screening of toxic phenotypes. The growth of random and control clones on selective medium in uninduced and overexpression conditions is shown. Drops of serial dilutions (1/100 to 1/100,000) of cultures were grown for 45 h at 30&#176;C. A3, non-toxic control clone transformed by pCMha190; H1, toxic control clone transformed by <it>MCM1 </it>gene cloned in pCMha190; G1, B2, D2, E3, library transformed clones, exhibiting different levels of toxicity in overexpression conditions (see Figure 2).</p>
               </text>
               <graphic file="gb-2004-5-9-r72-1"/>
            </fig>
            <fig id="F2">
               <title>
                  <p>Figure 2</p>
               </title>
               <caption>
                  <p>Second-round scoring of toxic phenotypes and control</p>
               </caption>
               <text>
                  <p>Second-round scoring of toxic phenotypes and control. <b>(a) </b>Selected clones from the first round were diluted and three drops (1/100, 1/1,000 and 1/10,000) were spotted and grown for 42 h at 30&#176;C, with controls on the same plates, for confirmation of toxicity. Growth levels in the presence and absence of doxycycline were scored as described in the text. Each clone was assigned a growth index where the first number represents the growth in uninduced conditions and the second number the growth in induced conditions; for example, 3/3 indicates a non-toxic insert; 3/0 indicates a highly toxic insert. Clone numbers are the same as in the tables describing the toxic inserts (see Additional data files 1, 2, 3 and 4). <b>(b) </b>After 5-FOA-induced plasmid loss, growth of surviving clones is scored in the same way as in (a). Wild-type phenotypes in overexpression conditions are indicative of plasmid-borne toxicity.</p>
               </text>
               <graphic file="gb-2004-5-9-r72-2"/>
            </fig>
            <tbl id="T1">
               <title>
                  <p>Table 1</p>
               </title>
               <caption>
                  <p>Distribution of the toxic inserts between the different genetic objects</p>
               </caption>
               <tblbdy cols="9">
                  <r>
                     <c ca="left">
                        <p>Genetic objects represented</p>
                     </c>
                     <c ca="center">
                        <p>Number of toxic inserts</p>
                     </c>
                     <c ca="center">
                        <p>Percentage of total</p>
                     </c>
                     <c ca="center">
                        <p>Mean size &#177; SD (nucleotides) (minimum-maximum)</p>
                     </c>
                     <c cspan="4" ca="center">
                        <p>Phenotypes</p>
                     </c>
                     <c ca="center">
                        <p>Inserts encoding artificial peptides</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c cspan="4">
                        <hr/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>3/0, 3/1</p>
                     </c>
                     <c ca="center">
                        <p>3/2</p>
                     </c>
                     <c ca="center">
                        <p>2/0, 2/1</p>
                     </c>
                     <c ca="center">
                        <p>1/0</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c cspan="9">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>In-frame ORF fragments</p>
                     </c>
                     <c ca="center">
                        <p>493</p>
                     </c>
                     <c ca="center">
                        <p>68.7</p>
                     </c>
                     <c ca="center">
                        <p>743 &#177; 311 (220-2,120)</p>
                     </c>
                     <c ca="center">
                        <p>375</p>
                     </c>
                     <c ca="center">
                        <p>87</p>
                     </c>
                     <c ca="center">
                        <p>23</p>
                     </c>
                     <c ca="center">
                        <p>8</p>
                     </c>
                     <c ca="center">
                        <p>_</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Antiparallel ORF fragments</p>
                     </c>
                     <c ca="center">
                        <p>68</p>
                     </c>
                     <c ca="center">
                        <p>9.6</p>
                     </c>
                     <c ca="center">
                        <p>532 &#177; 247 (140-1,220)</p>
                     </c>
                     <c ca="center">
                        <p>37</p>
                     </c>
                     <c ca="center">
                        <p>11</p>
                     </c>
                     <c ca="center">
                        <p>12</p>
                     </c>
                     <c ca="center">
                        <p>8</p>
                     </c>
                     <c ca="center">
                        <p>53</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Out-of-frame ORF fragments</p>
                     </c>
                     <c ca="center">
                        <p>53</p>
                     </c>
                     <c ca="center">
                        <p>7.5</p>
                     </c>
                     <c ca="center">
                        <p>733 &#177; 306 (170-1,620)</p>
                     </c>
                     <c ca="center">
                        <p>12</p>
                     </c>
                     <c ca="center">
                        <p>11</p>
                     </c>
                     <c ca="center">
                        <p>22</p>
                     </c>
                     <c ca="center">
                        <p>8</p>
                     </c>
                     <c ca="center">
                        <p>12</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Intergenic regions</p>
                     </c>
                     <c ca="center">
                        <p>41</p>
                     </c>
                     <c ca="center">
                        <p>6.0</p>
                     </c>
                     <c ca="center">
                        <p>625 &#177; 358 (170-1,820)</p>
                     </c>
                     <c ca="center">
                        <p>13</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>16</p>
                     </c>
                     <c ca="center">
                        <p>8</p>
                     </c>
                     <c ca="center">
                        <p>27</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>LTRs</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>0.3</p>
                     </c>
                     <c ca="center">
                        <p>595 (320-1,120)</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Ty elements</p>
                     </c>
                     <c ca="center">
                        <p>15 (10)</p>
                     </c>
                     <c ca="center">
                        <p>2.1</p>
                     </c>
                     <c ca="center">
                        <p>633 &#177; 265 (320-870)</p>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>_</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Y' elements</p>
                     </c>
                     <c ca="center">
                        <p>9 (3)</p>
                     </c>
                     <c ca="center">
                        <p>1.2</p>
                     </c>
                     <c ca="center">
                        <p>678 &#177; 370 (320-1,320)</p>
                     </c>
                     <c ca="center">
                        <p>9</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>6</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>RNA genes</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>0.5</p>
                     </c>
                     <c ca="center">
                        <p>662 &#177; 246 (470-1,020)</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>2 &#956;m plasmid</p>
                     </c>
                     <c ca="center">
                        <p>17 (10)</p>
                     </c>
                     <c ca="center">
                        <p>2.4</p>
                     </c>
                     <c ca="center">
                        <p>564 &#177; 288 (170-1,220)</p>
                     </c>
                     <c ca="center">
                        <p>13</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Mitochondrial DNA</p>
                     </c>
                     <c ca="center">
                        <p>12</p>
                     </c>
                     <c ca="center">
                        <p>1.7</p>
                     </c>
                     <c ca="center">
                        <p>483 &#177; 201 (200-920)</p>
                     </c>
                     <c ca="center">
                        <p>9</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>10</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total</p>
                     </c>
                     <c ca="center">
                        <p>714</p>
                     </c>
                     <c ca="center">
                        <p>100</p>
                     </c>
                     <c ca="center">
                        <p>703 &#177; 313 (140-2,120)</p>
                     </c>
                     <c ca="center">
                        <p>479</p>
                     </c>
                     <c ca="center">
                        <p>123</p>
                     </c>
                     <c ca="center">
                        <p>77</p>
                     </c>
                     <c ca="center">
                        <p>35</p>
                     </c>
                     <c ca="center">
                        <p>117</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>The first column indicates nature of sequence in toxic inserts. Second and third columns contain, respectively, actual number of inserts of each type and corresponding percentages. For Tys, Y' and 2 &#956;m plasmid, numbers in brackets represent numbers of in-frame fragments of natural ORFs. The fourth column shows the mean size of insert in nucleotides &#177; standard deviation (SD) with minimum and maximum sizes in brackets. Scoring of each type of phenotype is shown in the next four columns. The last column shows the number of inserts in which artificial ORFs of more than 24 codons were detected.</p>
               </tblfn>
            </tbl>
         </sec>
         <sec>
            <st>
               <p>Identification of the genomic inserts conferring toxic phenotypes</p>
            </st>
            <p>Inserts of the selected clones were identified by DNA sequencing (Materials and methods). The complete list of inserts is described in Additional files 1 and 2, and results are summarized in Table <tblr tid="T1">1</tblr>. A majority of inserts (493, or 69% of total) carry in-frame portions of annotated open reading frames (ORFs), excluding Ty and Y' ORFs. In addition, a significant number of inserts (162 (23%)) correspond to fragments of ORFs cloned either in antiparallel orientation or out-of-frame with respect to the initiator ATG codon or to intergenic regions. The 59 remaining cases (8% of total) correspond to fragments of transposable elements (17 clones) and subtelomeric Y' elements (9 clones), to RNA-coding genes (4 clones), and to non-chromosomal replicons such as the 2 &#956;m plasmid and mitochondrial DNA (mtDNA) (29 clones). If any random fragment of the yeast genome were capable of generating a toxic phenotype, in-frame ORF fusions would represent only around 10-12% of the selected inserts (around 70% of the genome corresponds to coding regions, and only one frame out of six corresponds to the natural frame). The fact that the toxic inserts correspond principally to in-frame portions of natural ORFs suggests that the coding part of the genome is the most prone to confer toxicity when overexpressed.</p>
         </sec>
         <sec>
            <st>
               <p>Analysis of domains within in-frame ORF fragments</p>
            </st>
            <p>The 493 inserts corresponding to in-frame ORF fragments represent 454 distinct annotated ORFs (see Materials and methods), which are randomly distributed throughout the 16 chromosomes of <it>S. cerevisiae</it> (see Additional file 1). In our screening, 32 ORFs were found twice, two ORFs were found three times and one ORF (<it>YHR056c</it> in the <it>CUP1</it> region) was found four times, the cloned fragments being either overlapping (22 ORFs) or non-overlapping (13 ORFs). The mean size of the coding region of inserts is 659 bp. The chosen cloning strategy favors recovery of central or carboxy-terminal coding parts of the natural yeast genes, whereas the amino-terminal coding regions are rare <abbrgrp><abbr bid="B7">7</abbr></abbrgrp>. In our work, the cloned insert encompasses the entire gene in only six cases (see Additional file 3, columns 20 to 23). In 154 additional cases, the insert corresponds to the carboxy-terminal portion of the natural protein (the stop codon is present). In 10 cases, the inserts start upstream of the natural ATG initiator codons, lengthening the natural peptides by reading in-frame through the untranslated region. Other cases correspond to the central coding region of natural genes.</p>
            <p>To find possible common characteristics, we compared all the peptides encoded by in-frame ORF fragments with one another. BLASTP analysis was combined with detection of characterized conserved domains, of COG patterns (clusters of predicted orthologous groups of proteins <abbrgrp><abbr bid="B32">32</abbr></abbrgrp>), and of transmembrane spans (TMS) to identify toxic inserts similar to each other (see Materials and methods). Out of the 493 in-frame ORF fragments, a total of 170 were divided up into 57 distinct groups of similarity, containing from two to 12 inserts, including overlapping fragments of the same ORF (see Additional file 4). It is expected that several ORFs from the same paralogous gene family are found in the same group. Note that in 16 out of 57 groups, the inserts contain transport-specific domains and/or transmembrane spans.</p>
            <p>As well as comparing inserts to each other, we also analyzed the totality of the conserved domains present in all peptides encoded by the 493 toxic inserts (see Materials and methods). Characterized domains are found, at least partially, in a total of 281 inserts (see Additional files 1 and 3). Of a total of 183 distinct domains, 46 are represented more than once. We have compared the frequency of these 46 domains among the toxic inserts versus their frequency among the 5,803 ORF-encoded proteins of the entire genome (Table <tblr tid="T2">2</tblr>). We find that 37 domains are significantly over-represented compared to a random expectation, suggesting that we have screened specific domains.</p>
            <tbl id="T2">
               <title>
                  <p>Table 2</p>
               </title>
               <caption>
                  <p>Conserved domains found more than once among the toxic in-frame ORF fragments</p>
               </caption>
               <tblbdy cols="8">
                  <r>
                     <c ca="left">
                        <p>Domain reference</p>
                     </c>
                     <c ca="left">
                        <p>Domain name</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>S. cerevisiae</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>Toxic inserts</p>
                     </c>
                     <c ca="center">
                        <p>Mean</p>
                     </c>
                     <c ca="center">
                        <p>95% confidence interval</p>
                     </c>
                     <c ca="center">
                        <p>Result</p>
                     </c>
                     <c ca="center">
                        <p>Domain description</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="8">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c cspan="8" ca="left">
                        <p>
                           <b>Transport-specific domains</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>COG0471</p>
                     </c>
                     <c ca="left">
                        <p>CitT</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>0.21</p>
                     </c>
                     <c ca="center">
                        <p>0.17-1.25</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>Di- and tricarboxylate transporter</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>pfam03169</p>
                     </c>
                     <c ca="left">
                        <p>OPT</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>0.16</p>
                     </c>
                     <c ca="center">
                        <p>0.11-1.17</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>Oligopeptide transporter protein</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>COG1953</p>
                     </c>
                     <c ca="left">
                        <p>FUI1</p>
                     </c>
                     <c ca="center">
                        <p>9</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>0.48</p>
                     </c>
                     <c ca="center">
                        <p>0.44-1.56</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>Nucleotide transporter</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>pfam00324</p>
                     </c>
                     <c ca="left">
                        <p>aa_permeases</p>
                     </c>
                     <c ca="center">
                        <p>22</p>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                     <c ca="center">
                        <p>1.16</p>
                     </c>
                     <c ca="center">
                        <p>1.04-2.22</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>Amino acid permease</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>pfam00153</p>
                     </c>
                     <c ca="left">
                        <p>mito_carr</p>
                     </c>
                     <c ca="center">
                        <p>97</p>
                     </c>
                     <c ca="center">
                        <p>24</p>
                     </c>
                     <c ca="center">
                        <p>5.13</p>
                     </c>
                     <c ca="center">
                        <p>5.07-6.45</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>Mitochondrial carrier protein</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>COG0531</p>
                     </c>
                     <c ca="left">
                        <p>PotE</p>
                     </c>
                     <c ca="center">
                        <p>26</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>1.38</p>
                     </c>
                     <c ca="center">
                        <p>1.28-2.48</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>Amino acid transporter</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>COG0474</p>
                     </c>
                     <c ca="left">
                        <p>MgtA</p>
                     </c>
                     <c ca="center">
                        <p>23</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>1.22</p>
                     </c>
                     <c ca="center">
                        <p>1.12-2.30</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>Cation transport ATPase</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>cd00267</p>
                     </c>
                     <c ca="left">
                        <p>ABC_ATPase</p>
                     </c>
                     <c ca="center">
                        <p>58</p>
                     </c>
                     <c ca="center">
                        <p>6</p>
                     </c>
                     <c ca="center">
                        <p>3.07</p>
                     </c>
                     <c ca="center">
                        <p>2.93-4.22</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>ABC transporter nucleotide-binding domain</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>pfam00664</p>
                     </c>
                     <c ca="left">
                        <p>ABC_membrane</p>
                     </c>
                     <c ca="center">
                        <p>14</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>0.74</p>
                     </c>
                     <c ca="center">
                        <p>0.68-1.82</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>ABC transporter transmembrane region</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>COG0842</p>
                     </c>
                     <c ca="left">
                        <p>COG0842</p>
                     </c>
                     <c ca="center">
                        <p>6</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>0.32</p>
                     </c>
                     <c ca="center">
                        <p>0.29-1.38</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>ABC-type multidrug transport system, permease component</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>COG1131</p>
                     </c>
                     <c ca="left">
                        <p>CcmA</p>
                     </c>
                     <c ca="center">
                        <p>54</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>2.86</p>
                     </c>
                     <c ca="center">
                        <p>2.74-4.01</p>
                     </c>
                     <c ca="center">
                        <p>NS</p>
                     </c>
                     <c ca="left">
                        <p>ABC-type multidrug transport system, ATPase component</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>pfam00083</p>
                     </c>
                     <c ca="left">
                        <p>Sugar_tr</p>
                     </c>
                     <c ca="center">
                        <p>58</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>3.07</p>
                     </c>
                     <c ca="center">
                        <p>2.94-4.23</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>Sugar (and other) transporter</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c cspan="8" ca="left">
                        <p>
                           <b>RNA- and DNA-binding domains</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>pfam00076</p>
                     </c>
                     <c ca="left">
                        <p>rrm</p>
                     </c>
                     <c ca="center">
                        <p>72</p>
                     </c>
                     <c ca="center">
                        <p>11</p>
                     </c>
                     <c ca="center">
                        <p>3.81</p>
                     </c>
                     <c ca="center">
                        <p>3.62-4.95</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>RNA recognition motif (transcription)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>COG5099</p>
                     </c>
                     <c ca="left">
                        <p>(PUF)</p>
                     </c>
                     <c ca="center">
                        <p>9</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>0.48</p>
                     </c>
                     <c ca="center">
                        <p>0.44-1.56</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>Pumilio family RNA-binding repeat (translational repression)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>smart00322</p>
                     </c>
                     <c ca="left">
                        <p>KH</p>
                     </c>
                     <c ca="center">
                        <p>11</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>0.58</p>
                     </c>
                     <c ca="center">
                        <p>0.54-1.66</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>K homology: RNA-binding domain (transcription, RNA metabolism)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>smart00356</p>
                     </c>
                     <c ca="left">
                        <p>ZnF_C3H1</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>0.26</p>
                     </c>
                     <c ca="center">
                        <p>0.21-1.30</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>Zinc finger, C3H1 type (transcription)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>COG5048</p>
                     </c>
                     <c ca="left">
                        <p>C2H2-type Zn_finger</p>
                     </c>
                     <c ca="center">
                        <p>15</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>0.79</p>
                     </c>
                     <c ca="center">
                        <p>0.74-1.89</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>Zn-finger (C2H2-type) (transcription)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>COG0210</p>
                     </c>
                     <c ca="left">
                        <p>UvrD</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>0.21</p>
                     </c>
                     <c ca="center">
                        <p>0.17-1.24</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>DNA and RNA helicases, superfamily I (DNA replication, recombination, repair)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>cd00086</p>
                     </c>
                     <c ca="left">
                        <p>Homeodomain</p>
                     </c>
                     <c ca="center">
                        <p>9</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>0.48</p>
                     </c>
                     <c ca="center">
                        <p>0.45-1.57</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>DNA binding domain (eukaryotic development)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>pfam00249</p>
                     </c>
                     <c ca="left">
                        <p>myb_DNA-binding</p>
                     </c>
                     <c ca="center">
                        <p>13</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>0.69</p>
                     </c>
                     <c ca="center">
                        <p>0.66-1.80</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>Myb-like DNA-binding domain (transcription)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>pfam00170</p>
                     </c>
                     <c ca="left">
                        <p>bZIP</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>0.21</p>
                     </c>
                     <c ca="center">
                        <p>0.17-1.25</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>Basic-leucine zipper DNA binding and dimerization domains (transcription)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>smart00066</p>
                     </c>
                     <c ca="left">
                        <p>GAL4</p>
                     </c>
                     <c ca="center">
                        <p>48</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>2.54</p>
                     </c>
                     <c ca="center">
                        <p>2.44-3.72</p>
                     </c>
                     <c ca="center">
                        <p>NS</p>
                     </c>
                     <c ca="left">
                        <p>GAL4-like Zn(II)2Cys6 DNA-binding domain (fungal) (transcription)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>pfam04082</p>
                     </c>
                     <c ca="left">
                        <p>Fungal_trans</p>
                     </c>
                     <c ca="center">
                        <p>26</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>1.38</p>
                     </c>
                     <c ca="center">
                        <p>1.29-2.48</p>
                     </c>
                     <c ca="center">
                        <p>NS</p>
                     </c>
                     <c ca="left">
                        <p>Fungal specific transcription factor domain</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>pfam00270</p>
                     </c>
                     <c ca="left">
                        <p>DEAD</p>
                     </c>
                     <c ca="center">
                        <p>48</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>2.54</p>
                     </c>
                     <c ca="center">
                        <p>2.38-3.63</p>
                     </c>
                     <c ca="center">
                        <p>NS</p>
                     </c>
                     <c ca="left">
                        <p>DEAD/DEAH box helicase (replication, repair, transcription)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>cd00079</p>
                     </c>
                     <c ca="left">
                        <p>HELICc</p>
                     </c>
                     <c ca="center">
                        <p>60</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>3.18</p>
                     </c>
                     <c ca="center">
                        <p>3.08-4.34</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="left">
                        <p>Helicase superfamily, C-ter domain (replication, repair, transcription)</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c cspan="8" ca="left">
                        <p>
                           <b>Domains involved in interactions with peptides, proteins or phospholipids</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>cd00200</p>
                     </c>
                     <c ca="left">
                        <p>WD40</p>
                     </c>
                     <c ca="center">
                        <p>327</p>
                     </c>
                     <c ca="center">
                        <p>29</p>
                     </c>
                     <c ca="center">
                        <p>17.31</p>
                     </c>
                     <c ca="center">
                        <p>16.87-18.54</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>Tandem repeats of about 40 residues interacting with peptides</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>pfam01602</p>
                     </c>
                     <c ca="left">
                        <p>Adaptin_N</p>
                     </c>
                     <c ca="center">
                        <p>9</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>0.48</p>
                     </c>
                     <c ca="center">
                        <p>0.43-1.54</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>N-ter region of adaptor proteins (clathrin-coated pits and vesicles)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>pfam00786</p>
                     </c>
                     <c ca="left">
                        <p>PBD</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>0.21</p>
                     </c>
                     <c ca="center">
                        <p>0.20-1.27</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>P21-Rho-binding domain (or CRIB)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>pfam00169</p>
                     </c>
                     <c ca="left">
                        <p>PH</p>
                     </c>
                     <c ca="center">
                        <p>11</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>0.58</p>
                     </c>
                     <c ca="center">
                        <p>0.55-1.67</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>PH: pleckstrin homology; binds phosphoinositides or other ligands (signalling)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>COG5271</p>
                     </c>
                     <c ca="left">
                        <p>MDN1</p>
                     </c>
                     <c ca="center">
                        <p>16</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>0.85</p>
                     </c>
                     <c ca="center">
                        <p>0.78-1.93</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>AAA: ATPase with von Willebrand factor type A domain (multiprotein complexes)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>smart00268</p>
                     </c>
                     <c ca="left">
                        <p>ACTIN</p>
                     </c>
                     <c ca="center">
                        <p>14</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>0.74</p>
                     </c>
                     <c ca="center">
                        <p>0.67-1.82</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>ACTIN, cytoskeleton/motor protein</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>COG5022</p>
                     </c>
                     <c ca="left">
                        <p>Myosin heavy chain</p>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>0.37</p>
                     </c>
                     <c ca="center">
                        <p>0.33-1.43</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>ATPase, molecular motor</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>COG5043</p>
                     </c>
                     <c ca="left">
                        <p>MRS6</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>0.21</p>
                     </c>
                     <c ca="center">
                        <p>0.17-1.24</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>Vacuolar protein sorting-associated protein</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>KOG0446*</p>
                     </c>
                     <c ca="left">
                        <p>Dynamin</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>0.16</p>
                     </c>
                     <c ca="center">
                        <p>0.13-1.20</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>GTPase that mediates vesicle trafficking</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c cspan="8" ca="left">
                        <p>
                           <b>Metabolism-related domains</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>pfam03901</p>
                     </c>
                     <c ca="left">
                        <p>PMP</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>0.21</p>
                     </c>
                     <c ca="center">
                        <p>0.21-1.29</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>Mannosyltransferase</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>COG1928</p>
                     </c>
                     <c ca="left">
                        <p>PMT1</p>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>0.37</p>
                     </c>
                     <c ca="center">
                        <p>0.30-1.40</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>Mannosyltransferase</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>pfam00561</p>
                     </c>
                     <c ca="left">
                        <p>Abhydrolase</p>
                     </c>
                     <c ca="center">
                        <p>18</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>0.95</p>
                     </c>
                     <c ca="center">
                        <p>0.88-2.05</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>Abhydrolase, alpha/beta hydrolase fold (catalytic domain)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>pfam00107</p>
                     </c>
                     <c ca="left">
                        <p>ADH_zinc_N</p>
                     </c>
                     <c ca="center">
                        <p>21</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>1.11</p>
                     </c>
                     <c ca="center">
                        <p>1.01-2.19</p>
                     </c>
                     <c ca="center">
                        <p>NS</p>
                     </c>
                     <c ca="left">
                        <p>Zinc-binding dehydrogenase</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>pfam00501</p>
                     </c>
                     <c ca="left">
                        <p>AMP-binding</p>
                     </c>
                     <c ca="center">
                        <p>11</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>0.58</p>
                     </c>
                     <c ca="center">
                        <p>0.51-1.64</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>AMP-binding synthetase</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c cspan="8" ca="left">
                        <p>
                           <b>Other domains</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>pfam00674</p>
                     </c>
                     <c ca="left">
                        <p>DUP</p>
                     </c>
                     <c ca="center">
                        <p>35</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>1.85</p>
                     </c>
                     <c ca="center">
                        <p>1.81-3.03</p>
                     </c>
                     <c ca="center">
                        <p>NS</p>
                     </c>
                     <c ca="left">
                        <p>DUP family (proteins of unknown functions)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>COG5384</p>
                     </c>
                     <c ca="left">
                        <p>Mpp10</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>0.05</p>
                     </c>
                     <c ca="center">
                        <p>0.03-1.07</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>M phase phosphoprotein 10 (U3 small nucleolar ribonucleoprotein component)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>COG5032</p>
                     </c>
                     <c ca="left">
                        <p>TEL1</p>
                     </c>
                     <c ca="center">
                        <p>8</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>0.42</p>
                     </c>
                     <c ca="center">
                        <p>0.34-1.44</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>PI kinase and protein kinases of the PI kinase family</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>COG1025</p>
                     </c>
                     <c ca="left">
                        <p>Ptr</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>0.26</p>
                     </c>
                     <c ca="center">
                        <p>0.22-1.31</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>Zn-dependent peptidases (secreted/periplasmic, insulinase-like)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>pfam02902</p>
                     </c>
                     <c ca="left">
                        <p>Peptidase_C48</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>0.11</p>
                     </c>
                     <c ca="center">
                        <p>0.08-1.13</p>
                     </c>
                     <c ca="center">
                        <p>+</p>
                     </c>
                     <c ca="left">
                        <p>Ulp1 protease family, C-terminal catalytic domain</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>pfam00004</p>
                     </c>
                     <c ca="left">
                        <p>AAA</p>
                     </c>
                     <c ca="center">
                        <p>43</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>2.28</p>
                     </c>
                     <c ca="center">
                        <p>2.15-3.39</p>
                     </c>
                     <c ca="center">
                        <p>NS</p>
                     </c>
                     <c ca="left">
                        <p>AAA, ATPase family associated with various cellular activities (AAA)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>smart00220</p>
                     </c>
                     <c ca="left">
                        <p>S_TKc</p>
                     </c>
                     <c ca="center">
                        <p>125</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>6.52</p>
                     </c>
                     <c ca="center">
                        <p>6.31-7.72</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="left">
                        <p>Serine/threonine protein kinases, catalytic domain</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>Peptide sequences of toxic natural ORF fragments were searched for domains (see text), and the frequency of domains found more than once was compared to the frequency in the whole proteome. References and names of domains are in the first two columns; occurrences in the whole genome (<it>S. cerevisiae</it>) and in the toxic inserts are in the third and fourth columns, respectively. The next three columns show the statistical analysis performed as follows: 1,000 random selections of 843 domains (total number of occurrences in the toxic inserts) were made from the set of 15,925 domains identified in <it>S. cerevisiae </it>(see Materials and methods); mean (column 5) represents the mean number of occurrences of each domain among the toxic inserts; the 95% confidence interval (column 6) was calculated using the SD of the 1,000 random drawings; column 7 shows the result of this analysis for each domain: NS, not significant; +, domain over-represented in toxic inserts; -, domain under-represented in toxic inserts. The last column gives a brief description of domains from NCBI Conserved Domain Database [65]. *KOG0446 was found using cdd.v1.63 of NCBI CD-Search [64].</p>
               </tblfn>
            </tbl>
            <p>These 37 domains correspond predominantly to various transporter domains (11 cases), such as amino-acid permeases and mitochondrial carrier protein domains. The toxicity of these domains is probably due to the presence of transmembrane spans. Indeed, 132 out of the 493 toxic peptides contain at least two transmembrane spans, including cases where one span is putative (see Materials and methods). Among these, 63 contain three or more predicted spans and 26 have five spans or more. Putative spans were also recognized in 84 other ORF fragments (seven with at least three spans, 15 with two spans, and 62 with one span) (see Additional data files 1 and 3).</p>
            <p>RNA- and DNA-binding domains (nine cases) involved in replication, transcription or translation functions, such as PUF, KH and rrm, are also represented much more often than expected (Table <tblr tid="T2">2</tblr>). The PUF domain is also involved in recruitment of proteins into a complex that controls mRNA translation (see <abbrgrp><abbr bid="B33">33</abbr></abbrgrp> for review).</p>
            <p>Other important domains for interactions with polypeptides, phospholipids or small molecules (nine cases) are also over-represented. The WD40 motif, a propeller-like platform for stable or reversible binding of proteins in eukaryotes, has been found in inserts of 12 distinct ORFs (see Additional data file 3). The 12 ORFs code for proteins having interactions with other proteins in complexes related to RNA processing or transcription <abbrgrp><abbr bid="B10">10</abbr></abbrgrp>, and nine have at least one partner also selected during our screening (see Discussion). Other interacting domains were found, such as dynamin, MRS6, and adaptin_N domains, which have roles in the dynamics of proteins, membranes and cytoskeleton, and PBD, a small domain which binds small GTPases and inhibits transcription activation. The PH domain, which binds phosphoinositides or other ligands and is involved in signal transduction, was found in inserts of three distinct ORFs involved in different functions: metabolism, cell fate, transcription (see Additional data file 3). Finally, other over-represented domains are related to metabolism and other functions (eight cases), of which several may be involved in interactions with other domains.</p>
            <p>The serine/threonine protein kinase domain (S_TKc) is significantly under-represented in our screen. Among the 10 toxic inserts whose cognate genes code for protein kinases (PK), only four contain this domain (Additional data file 3). In these four cases, the S_TKc domain is either truncated (Additional data file 4), or flanked by a coiled-coil region and/or a low-complexity segment. Two other inserts contain the PBD (and PH) domains, and the four remaining inserts contain no characterized domain to date. As it is known that overexpression of some protein kinases is deleterious for cells (see <abbrgrp><abbr bid="B24">24</abbr></abbrgrp> and references therein), our results suggest that a domain different from the catalytic domain is responsible for the toxicity of these proteins, and that the fragments selected in our screen have a role in binding ligands such as substrates or regulators of protein kinase activity, or of proteins involved in the signaling cascades. Three other genes coding for protein kinases of the phosphatidylinositol 3-kinase (PI kinase) family are also represented in our screen by four toxic inserts, none of which contained the kinase domain (see Discussion).</p>
            <p>The remaining 137 domains (out of 183) were found only once each. Many correspond to functional categories described above, such as transport, metabolism, and interactions with nucleotides, other proteins or other ligands. Seven domains associated with ubiquitination functions were also found (see Additional data files 3 and 5). Several of the domains encountered have also been isolated as mammalian genetic suppressor elements (GSEs), which are cDNA fragments that inhibit cell growth (see <abbrgrp><abbr bid="B34">34</abbr></abbrgrp> and references therein).</p>
            <p>In addition to the domains described above, we found toxic inserts coding for natural peptides without recognizable domains but containing regions of low complexity (56 cases). A number of these peptides are highly charged, either negatively or positively (see Additional data file 3). Such charged peptides might interact in an artifactual way with other charged domains of proteins or nucleic acids or with small molecules. Interestingly, the prion-like (Q+N)-rich domain was found in eight of the natural peptides having low-complexity regions.</p>
         </sec>
         <sec>
            <st>
               <p>Nature of the selected genes</p>
            </st>
            <p>We have seen above that 493/714 toxic inserts are in-frame fragments of protein-coding genes. The complete list of the 454 genes corresponding to these toxic inserts is given in Additional data files 1 and 2. Their sizes range between 282 bp and 14,733 bp. The mean size of this distribution is 2,401 bp (standard deviation (SD) 1,671 bp), to be compared with a mean size of 1,444 bp (SD 1,094 bp) for the entire set of 5,803 ORFs of the yeast genome. The bias towards longer ORFs is expected from our cloning strategy (see above). Note that the 35 ORFs that we found more than once are nearly randomly distributed in various size classes.</p>
            <p>We examined the distribution of these genes according to different criteria, such as function, subcellular localization, viability and phylogeny (Table <tblr tid="T3">3</tblr>) and compared it to the distribution of the genes of <it>S. cerevisiae</it>.</p>
            <tbl id="T3">
               <title>
                  <p>Table 3</p>
               </title>
               <caption>
                  <p>Distribution of selected genes versus all <it>S. cerevisiae </it>genes</p>
               </caption>
               <tblbdy cols="5">
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>All <it>S. cerevisiae </it>genes</p>
                     </c>
                     <c ca="center">
                        <p>Percentage of total</p>
                     </c>
                     <c ca="center">
                        <p>Selected toxic genes</p>
                     </c>
                     <c ca="center">
                        <p>Percentage of total</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="5">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Functional classes (MIPS data)</b>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Cell cycle_DNA processing</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>670</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>11.5</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>75</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>16.5*</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Cell fate</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>486</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>8.4</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>66</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>14.5*</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Cell rescue, defense and virulence</p>
                     </c>
                     <c ca="center">
                        <p>288</p>
                     </c>
                     <c ca="center">
                        <p>5.0</p>
                     </c>
                     <c ca="center">
                        <p>23</p>
                     </c>
                     <c ca="center">
                        <p>5.1</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Cellular communication/signal transduction mechanism</p>
                     </c>
                     <c ca="center">
                        <p>59</p>
                     </c>
                     <c ca="center">
                        <p>1.0</p>
                     </c>
                     <c ca="center">
                        <p>6</p>
                     </c>
                     <c ca="center">
                        <p>1.3</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Cellular transport and transport mechanisms</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>525</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>9.0</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>67</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>14.8*</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Classification not yet clear-cut</p>
                     </c>
                     <c ca="center">
                        <p>112</p>
                     </c>
                     <c ca="center">
                        <p>1.9</p>
                     </c>
                     <c ca="center">
                        <p>6</p>
                     </c>
                     <c ca="center">
                        <p>1.3</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Control of cellular organization</p>
                     </c>
                     <c ca="center">
                        <p>207</p>
                     </c>
                     <c ca="center">
                        <p>3.6</p>
                     </c>
                     <c ca="center">
                        <p>22</p>
                     </c>
                     <c ca="center">
                        <p>4.8</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Energy</p>
                     </c>
                     <c ca="center">
                        <p>244</p>
                     </c>
                     <c ca="center">
                        <p>4.2</p>
                     </c>
                     <c ca="center">
                        <p>12</p>
                     </c>
                     <c ca="center">
                        <p>2.6</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Metabolism</p>
                     </c>
                     <c ca="center">
                        <p>1,061</p>
                     </c>
                     <c ca="center">
                        <p>18.3</p>
                     </c>
                     <c ca="center">
                        <p>88</p>
                     </c>
                     <c ca="center">
                        <p>19.4</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Protein fate (folding, modification, destination)</p>
                     </c>
                     <c ca="center">
                        <p>593</p>
                     </c>
                     <c ca="center">
                        <p>10.2</p>
                     </c>
                     <c ca="center">
                        <p>47</p>
                     </c>
                     <c ca="center">
                        <p>10.4</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Protein synthesis</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>377</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>6.5</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>17</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>3.7*</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Regulation of/interaction with cellular environment</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>197</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>3.4</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>29</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>6.4</b>
                           <sup>&#8224;</sup>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Transcription</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>801</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>13.8</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>88</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>19.4*</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Transport facilitation</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>321</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>5.5</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>61</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>13.4*</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Unclassified</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1,706</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>29.4</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>91</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>20.0*</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Cellular localization (MIPS data)</b>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Extracellular</p>
                     </c>
                     <c ca="center">
                        <p>54</p>
                     </c>
                     <c ca="center">
                        <p>1.4</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>1.6</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Cell wall</p>
                     </c>
                     <c ca="center">
                        <p>38</p>
                     </c>
                     <c ca="center">
                        <p>1.0</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>1.3</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Golgi</p>
                     </c>
                     <c ca="center">
                        <p>103</p>
                     </c>
                     <c ca="center">
                        <p>2.6</p>
                     </c>
                     <c ca="center">
                        <p>8</p>
                     </c>
                     <c ca="center">
                        <p>2.5</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Transport vesicles</p>
                     </c>
                     <c ca="center">
                        <p>54</p>
                     </c>
                     <c ca="center">
                        <p>1.4</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>0.9</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Plasma membrane</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>171</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>4.4</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>34</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>10.7*</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Nucleus</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1,367</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>34.8</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>130</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>40.8</b>
                           <sup>&#8224;</sup>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Cytoplasm</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2,001</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>50.9</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>137</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>42.9*</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Peroxisome</p>
                     </c>
                     <c ca="center">
                        <p>42</p>
                     </c>
                     <c ca="center">
                        <p>1.1</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>0.9</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Endosome</p>
                     </c>
                     <c ca="center">
                        <p>20</p>
                     </c>
                     <c ca="center">
                        <p>0.5</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>0.6</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Cytoskeleton</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>154</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>3.9</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>22</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>6.9</b>
                           <sup>&#8224;</sup>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Vacuole</p>
                     </c>
                     <c ca="center">
                        <p>82</p>
                     </c>
                     <c ca="center">
                        <p>2.1</p>
                     </c>
                     <c ca="center">
                        <p>8</p>
                     </c>
                     <c ca="center">
                        <p>2.5</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Endoplasmic reticulum</p>
                     </c>
                     <c ca="center">
                        <p>353</p>
                     </c>
                     <c ca="center">
                        <p>9.0</p>
                     </c>
                     <c ca="center">
                        <p>27</p>
                     </c>
                     <c ca="center">
                        <p>8.5</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Mitochondria</p>
                     </c>
                     <c ca="center">
                        <p>562</p>
                     </c>
                     <c ca="center">
                        <p>14.3</p>
                     </c>
                     <c ca="center">
                        <p>37</p>
                     </c>
                     <c ca="center">
                        <p>11.6</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Viability (MIPS data)</b>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Essential</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>939</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>16.2</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>96</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>21.1</b>
                           <sup>&#8224;</sup>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Essential or not</p>
                     </c>
                     <c ca="center">
                        <p>160</p>
                     </c>
                     <c ca="center">
                        <p>2.8</p>
                     </c>
                     <c ca="center">
                        <p>20</p>
                     </c>
                     <c ca="center">
                        <p>4.4</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Phylogeny (G&#233;nolevures data)</b>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Conserved</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>3,717</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>64.1</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>336</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>74.0*</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Ascomycete-specifics</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1,674</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>28.8</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>106</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>23.3*</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Orphan</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>412</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>7.1</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>10</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>2.2*</b>
                        </p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>The distribution of genes was examined in respect of four classifications: function, cellular localization of the gene product, viability and phylogeny. Data are from MIPS [38] and G&#233;nolevures [37]. Cellular localization was known for 3,928 out of the 5,803 proteins in the entire genome and for 319 proteins out of the 454 that yield toxic inserts. For other comparisons, the set of 454 selected genes was compared to the set of 5,803 genes of <it>S. cerevisiae</it>. Note that a given gene may be present in more than one MIPS class. Significant evidence that a given gene class is over- or under-represented among toxic genes as compared to all <it>S. cerevisiae </it>genes is emphasized by bold characters. *<it>p </it>&lt; 0.005; <sup>&#8224;</sup><it>p </it>&lt; 0.025.</p>
               </tblfn>
            </tbl>
            <p>Among the 454 ORFs identified, 91 are unclassified, and function is not yet clear for six others (see Additional data file 3). The remaining ORFs represent a variety of functional classes (Table <tblr tid="T3">3</tblr>). Distribution of the 454 ORFs shows statistically significant deviations for eight out of the 15 functional classes, taking into account biases due to mean size of genes in each class. Globally, there is a deficit of genes involved in protein synthesis and of unclassified genes, and an excess of genes involved in transport facilitation and cellular transport (echoing the fact that we found many inserts containing transporter domains and transmembrane spans), in cell fate, in transcription and, to a lesser extent, in cell cycle/DNA processing and in homeostasis (regulation of/interaction with the environment).</p>
            <p>As seen above, many toxic inserts contain multiple predicted TMS. Such inserts correspond most often to genes coding for transporters or for non-transporter membrane proteins <abbrgrp><abbr bid="B35">35</abbr></abbrgrp>. We have selected a total of 96 transporters (see Additional data file 3) of which 18 belong to the class of putative uncharacterized transporters, whose toxic inserts contain several TMS. Fourteen others belong to the class of transporters of unknown classification, including 13 genes of the nuclear-pore complex family, whereas there is a total of 58 genes in this family in the whole genome. On the other hand, 24 genes coding for non-transporter membrane proteins were also selected. Taken together, 120 transporters and non-transporter membrane proteins are represented in our screen, twice as many as expected (61 expected), as 782/5,803 ORFs are known or predicted as coding for such proteins <abbrgrp><abbr bid="B35">35</abbr></abbrgrp>.</p>
            <p>The distribution of the proteins encoded by these genes in the cell is strongly biased in favour of the plasma membrane and against the cytoplasm, and, to a lesser extent, in favour of the nucleus and cytoskeleton (Table <tblr tid="T3">3</tblr>).</p>
            <p>Although the majority of inserts originate from non-essential genes, we have found 96 essential genes (21%) among the selected ORFs. This is a significantly higher percentage than in the whole genome, where 939/5,803 genes (16.2%) are essential (Table <tblr tid="T3">3</tblr>).</p>
            <p>Using the classification from Malpertuy <it>et al. </it><abbrgrp><abbr bid="B36">36</abbr></abbrgrp> and additional updating (G&#233;nolevures <abbrgrp><abbr bid="B37">37</abbr></abbrgrp>), we find that the majority of genes yielding toxic fragments in this work are conserved (336/454 (74%)) between <it>S. cerevisiae </it>and other sequenced organisms, whereas 106 (23%) are ascomycete-specific and 10 (2.2%) are orphan genes. This distribution is significantly different from the distribution among the 5,803 genes of <it>S. cerevisiae</it>, where 64% of protein-coding genes are conserved (see Table <tblr tid="T3">3</tblr>). The under-representation of orphan genes in our screen is already apparent in the under-representation of functionally unclassified genes, as a high proportion of the orphans in the whole genome (79%) are also unclassified (data from G&#233;nolevures <abbrgrp><abbr bid="B37">37</abbr></abbrgrp> and Munich Information Center for Protein Sequences (MIPS) <abbrgrp><abbr bid="B38">38</abbr></abbrgrp>).</p>
         </sec>
         <sec>
            <st>
               <p>Toxicity of entire genes versus ORF fragments</p>
            </st>
            <p>To compare the phenotypes conferred by overexpression of the entire gene and of the gene fragment, we have cloned the cognate entire genes of 13 in-frame toxic inserts into the vector pCMha191 (see Materials and methods). One criterion for the choice of the genes was the absence of a mutant phenotype of the corresponding gene disruption at the time this work was started, except for the <it>NOP4 </it>gene whose disruption is lethal. Six of these genes are singletons; three others have a paralog already known as toxic upon overexpression. Six out of the 13 still have no known function to date (Table <tblr tid="T4">4</tblr>). Expression at the protein level of both entire gene and gene fragment was verified by western-blot analysis, using an anti-hemagglutinin (HA) antibody (data not shown). As seen in Table <tblr tid="T4">4</tblr> and Figure <figr fid="F3">3</figr>, we found that overexpression of 10 genes was as toxic as or more toxic than overexpression of the gene fragments. One gene, <it>YGR149w</it>, was less toxic in its entire version than in the truncated form, which was weakly toxic. Finally, we found that two genes, <it>YML128c</it>/<it>MSC1 </it>and <it>YDL112w/TRM3</it>, showed no toxicity when overexpressed, whereas the cloned inserts were strongly toxic. In these two cases, the immunolocalization of overexpressed products was examined, and the cytoplasmic localization of the fragment agreed with the location of the natural gene product (data not shown), indicating that the toxic effect is not the result of mislocalization of the overexpressed fragment. The gene <it>MSC1 </it>had already been screened <abbrgrp><abbr bid="B24">24</abbr></abbrgrp> as a toxic fragment in overexpression conditions, the region concerned being the same as in our screening. This gene has low similarity to a stress protein of <it>Schizosaccharomyces pombe </it>and has a role in meiotic recombination. 
The <it>TRM3 </it>gene contains a carboxy-terminal domain responsible for tRNA methyltransferase activity <abbrgrp><abbr bid="B39">39</abbr></abbrgrp>, which is absent from our insert. The protein is a member of a complex probably involved in signaling <abbrgrp><abbr bid="B10">10</abbr></abbrgrp>.</p>
            <tbl id="T4">
               <title>
                  <p>Table 4</p>
               </title>
               <caption>
                  <p>Toxicity of fragments versus whole ORF products</p>
               </caption>
               <tblbdy cols="7">
                  <r>
                     <c ca="left">
                        <p>ORF/Gene name</p>
                     </c>
                     <c ca="left">
                        <p>Gene description</p>
                     </c>
                     <c ca="center">
                        <p>Phenotype of gene deletion</p>
                     </c>
                     <c ca="center">
                        <p>Conserved domain or TMS in entire protein</p>
                     </c>
                     <c ca="center">
                        <p>Phenotype of gene overexpression</p>
                     </c>
                     <c ca="center">
                        <p>Conserved domain or TMS in insert</p>
                     </c>
                     <c ca="center">
                        <p>Phenotype of insert overexpression</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="7">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>YDL112w/TRM3*</p>
                     </c>
                     <c ca="left">
                        <p>tRNA 2'-O-ribose methyltransferase</p>
                     </c>
                     <c ca="center">
                        <p>Viable</p>
                     </c>
                     <c ca="center">
                        <p>SpoU_methylase</p>
                     </c>
                     <c ca="center">
                        <p>3/3</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>3/1</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>YML128c/MSC1/GIN3*<sup>&#8224;</sup></p>
                     </c>
                     <c ca="left">
                        <p>Weak similarity to <it>Schizosaccharomyces pombe </it>stress protein</p>
                     </c>
                     <c ca="center">
                        <p>Viable</p>
                     </c>
                     <c ca="center">
                        <p>1 TMS</p>
                     </c>
                     <c ca="center">
                        <p>3/3</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>3/0</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>YGR149w/_* <sup>&#8225;&#167;</sup></p>
                     </c>
                     <c ca="left">
                        <p>Similar to <it>S. pombe </it>hypothetical protein</p>
                     </c>
                     <c ca="center">
                        <p>Viable</p>
                     </c>
                     <c ca="center">
                        <p>5 TMS</p>
                     </c>
                     <c ca="center">
                        <p>3/2 to 3/3</p>
                     </c>
                     <c ca="center">
                        <p>3 TMS</p>
                     </c>
                     <c ca="center">
                        <p>3/2</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>YGL023c/PIB2* <sup>&#167;</sup></p>
                     </c>
                     <c ca="left">
                        <p>Phosphatidylinositol 3-phosphate binding</p>
                     </c>
                     <c ca="center">
                        <p>Viable</p>
                     </c>
                     <c ca="center">
                        <p>FYVE</p>
                     </c>
                     <c ca="center">
                        <p>3/1</p>
                     </c>
                     <c ca="center">
                        <p>FYVE</p>
                     </c>
                     <c ca="center">
                        <p>3/0</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>YPL043w/NOP4<sup>&#182;</sup></p>
                     </c>
                     <c ca="left">
                        <p>Nucleolar protein, RNA processing</p>
                     </c>
                     <c ca="center">
                        <p>Lethal</p>
                     </c>
                     <c ca="center">
                        <p>RRM (4 motifs)</p>
                     </c>
                     <c ca="center">
                        <p>3/0</p>
                     </c>
                     <c ca="center">
                        <p>Bias D, E, K</p>
                     </c>
                     <c ca="center">
                        <p>3/0</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>YOR166c/_* <sup>&#167;</sup></p>
                     </c>
                     <c ca="left">
                        <p>Similarity to hypothetical <it>S. pombe </it>protein</p>
                     </c>
                     <c ca="center">
                 