<?xml version='1.0'?>
<!DOCTYPE art SYSTEM 'http://www.biomedcentral.com/xml/article.dtd'>
<art>
   <ui>gb-2007-8-6-r113</ui>
   <ji>GBJ</ji>
   <fm>
      <dochead>Method</dochead>
      <bibl>
         <title>
            <p>LongSAGE profiling of nine human embryonic stem cell lines</p>
         </title>
         <aug>
            <au id="A1">
               <snm>Hirst</snm>
               <fnm>Martin</fnm>
               <insr iid="I1"/>
               <email>mhirst@bcgsc.ca</email>
            </au>
            <au id="A2">
               <snm>Delaney</snm>
               <fnm>Allen</fnm>
               <insr iid="I1"/>
               <email>adelaney@bcgsc.ca</email>
            </au>
            <au id="A3">
               <snm>Rogers</snm>
               <mi>A</mi>
               <fnm>Sean</fnm>
               <insr iid="I1"/>
               <email>srogers@bcgsc.ca</email>
            </au>
            <au id="A4">
               <snm>Schnerch</snm>
               <fnm>Angelique</fnm>
               <insr iid="I1"/>
               <email>angels@bcgsc.ca</email>
            </au>
            <au id="A5">
               <snm>Persaud</snm>
               <mi>R</mi>
               <fnm>Deryck</fnm>
               <insr iid="I1"/>
               <email>dpersaud@bcgsc.ca</email>
            </au>
            <au id="A6">
               <snm>O'Connor</snm>
               <mi>D</mi>
               <fnm>Michael</fnm>
               <insr iid="I2"/>
               <email>moconnor@bccrc.ca</email>
            </au>
            <au id="A7">
               <snm>Zeng</snm>
               <fnm>Thomas</fnm>
               <insr iid="I1"/>
               <email>tzeng@bcgsc.ca</email>
            </au>
            <au id="A8">
               <snm>Moksa</snm>
               <fnm>Michelle</fnm>
               <insr iid="I1"/>
               <email>mmoksa@bcgsc.ca</email>
            </au>
            <au id="A9">
               <snm>Fichter</snm>
               <fnm>Keith</fnm>
               <insr iid="I1"/>
               <email>kfichter@bcgsc.ca</email>
            </au>
            <au id="A10">
               <snm>Mah</snm>
               <fnm>Diana</fnm>
               <insr iid="I1"/>
               <email>dmah@bcgsc.ca</email>
            </au>
            <au id="A11">
               <snm>Go</snm>
               <fnm>Anne</fnm>
               <insr iid="I1"/>
               <email>ago@bcgsc.ca</email>
            </au>
            <au id="A12">
               <snm>Morin</snm>
               <mi>D</mi>
               <fnm>Ryan</fnm>
               <insr iid="I1"/>
               <email>rmorin@bcgsc.ca</email>
            </au>
            <au id="A13">
               <snm>Baross</snm>
               <fnm>Agnes</fnm>
               <insr iid="I1"/>
               <email>abaross@bcgsc.ca</email>
            </au>
            <au id="A14">
               <snm>Zhao</snm>
               <fnm>Yongjun</fnm>
               <insr iid="I1"/>
               <email>yzhao@bcgsc.ca</email>
            </au>
            <au id="A15">
               <snm>Khattra</snm>
               <fnm>Jaswinder</fnm>
               <insr iid="I1"/>
               <email>jkhattra@bcgsc.ca</email>
            </au>
            <au id="A16">
               <snm>Prabhu</snm>
               <fnm>Anna-Liisa</fnm>
               <insr iid="I1"/>
               <email>aprabhu@bcgsc.ca</email>
            </au>
            <au id="A17">
               <snm>Pandoh</snm>
               <fnm>Pawan</fnm>
               <insr iid="I1"/>
               <email>ppandoh@bcgsc.ca</email>
            </au>
            <au id="A18">
               <snm>McDonald</snm>
               <fnm>Helen</fnm>
               <insr iid="I1"/>
               <email>hmcdonald@bcgsc.ca</email>
            </au>
            <au id="A19">
               <snm>Asano</snm>
               <fnm>Jennifer</fnm>
               <insr iid="I1"/>
               <email>jasono@bcgsc.ca</email>
            </au>
            <au id="A20">
               <snm>Dhalla</snm>
               <fnm>Noreen</fnm>
               <insr iid="I1"/>
               <email>ndhalla@bcgsc.ca</email>
            </au>
            <au id="A21">
               <snm>Ma</snm>
               <fnm>Kevin</fnm>
               <insr iid="I1"/>
               <email>kma@bcgsc.ca</email>
            </au>
            <au id="A22">
               <snm>Lee</snm>
               <fnm>Stephanie</fnm>
               <insr iid="I1"/>
               <email>slee@bcgsc.ca</email>
            </au>
            <au id="A23">
               <snm>Ally</snm>
               <fnm>Adrian</fnm>
               <insr iid="I1"/>
               <email>aally@bcgsc.ca</email>
            </au>
            <au id="A24">
               <snm>Chahal</snm>
               <fnm>Neil</fnm>
               <insr iid="I1"/>
               <email>nchahal@bcgsc.ca</email>
            </au>
            <au id="A25">
               <snm>Menzies</snm>
               <fnm>Stephanie</fnm>
               <insr iid="I1"/>
               <email>smenzies@bcgsc.ca</email>
            </au>
            <au id="A26">
               <snm>Siddiqui</snm>
               <fnm>Asim</fnm>
               <insr iid="I1"/>
               <email>asiddiqui@bcgsc.ca</email>
            </au>
            <au id="A27">
               <snm>Holt</snm>
               <fnm>Robert</fnm>
               <insr iid="I1"/>
               <email>rholt@bcgsc.ca</email>
            </au>
            <au id="A28">
               <snm>Jones</snm>
               <fnm>Steven</fnm>
               <insr iid="I1"/>
               <email>sjones@bcgsc.ca</email>
            </au>
            <au id="A29">
               <snm>Gerhard</snm>
               <mi>S</mi>
               <fnm>Daniela</fnm>
               <insr iid="I3"/>
               <email>gerhardd@mail.nih.gov</email>
            </au>
            <au id="A30">
               <snm>Thomson</snm>
               <mi>A</mi>
               <fnm>James</fnm>
               <insr iid="I4"/>
               <email>thomson@primate.wisc.edu</email>
            </au>
            <au id="A31">
               <snm>Eaves</snm>
               <mi>J</mi>
               <fnm>Connie</fnm>
               <insr iid="I2"/>
               <email>ceaves@bccrc.ca</email>
            </au>
            <au id="A32" ca="yes">
               <snm>Marra</snm>
               <mi>A</mi>
               <fnm>Marco</fnm>
               <insr iid="I1"/>
               <email>mmarra@bcgsc.ca</email>
            </au>
         </aug>
         <insg>
            <ins id="I1">
               <p>Genome Sciences Centre, British Columbia Cancer Agency, Vancouver, British Columbia, Canada, V5Z 1L3</p>
            </ins>
            <ins id="I2">
               <p>Terry Fox Laboratory, British Columbia Cancer Agency, Vancouver, British Columbia, Canada, V5Z 1L3</p>
            </ins>
            <ins id="I3">
               <p>National Cancer Institute, National Institutes of Health, Bethesda, Maryland 20892, USA</p>
            </ins>
            <ins id="I4">
               <p>Wisconsin National Primate Research Centre and Department of Anatomy, School of Medicine, University of Wisconsin, Madison, Wisconsin 53715, USA</p>
            </ins>
         </insg>
         <source>Genome Biology</source>
         <issn>1465-6906</issn>
         <pubdate>2007</pubdate>
         <volume>8</volume>
         <issue>6</issue>
         <fpage>R113</fpage>
         <url>http://genomebiology.com/2007/8/6/R113</url>
         <xrefbib>
            <pubidlist>
               <pubid idtype="pmpid">17570852</pubid>
               <pubid idtype="doi">10.1186/gb-2007-8-6-r113</pubid>
            </pubidlist>
         </xrefbib>
      </bibl>
      <history>
         <rec>
            <date>
               <day>18</day>
               <month>12</month>
               <year>2006</year>
            </date>
         </rec>
         <revrec>
            <date>
               <day>23</day>
               <month>4</month>
               <year>2007</year>
            </date>
         </revrec>
         <acc>
            <date>
               <day>14</day>
               <month>6</month>
               <year>2007</year>
            </date>
         </acc>
         <pub>
            <date>
               <day>14</day>
               <month>06</month>
               <year>2007</year>
            </date>
         </pub>
      </history>
      <cpyrt>
         <year>2007</year>
         <collab>Hirst et al.; licensee BioMed Central Ltd.</collab>
         <note>This is an open access article distributed under the terms of the Creative Commons Attribution License (<url>http://creativecommons.org/licenses/by/2.0</url>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</note>
      </cpyrt>
      <shorttitle>
         <p>Human embryonic stem cell transcripts</p>
      </shorttitle>
      <shortabs>
         <p>Analysis of a 2.5 million LongSAGE sequence tag resource generated from nine human embryonic stem cell lines reveals an enrichment of RNA binding proteins and novel ES-specific transcripts.</p>
      </shortabs>
      <abs>
         <sec>
            <st>
               <p>Abstract</p>
            </st>
            <p>To facilitate discovery of novel human embryonic stem cell (ESC) transcripts, we generated 2.5 million LongSAGE tags from 9 human ESC lines. Analysis of this data revealed that ESCs express proportionately more RNA binding proteins compared with terminally differentiated cells, and identified novel ESC transcripts, at least one of which may represent a marker of the pluripotent state.</p>
         </sec>
      </abs>
   </fm>
   <meta>
      <classifications>
         <classification type="BMC" subtype="man_spc_id" id="30010005">Development</classification>
         <classification type="BMC" subtype="man_spc_id" id="30010016">Molecular biology</classification>
         <classification type="BMC" subtype="man_spc_id" id="30010010">Genome studies</classification>
      </classifications>
   </meta>
   <bdy>
      <sec>
         <st>
            <p>Background</p>
         </st>
         <p>Embryonic stem cells (ESCs) can be derived from the inner cell mass of blastocysts and are defined by their ability to be propagated indefinitely as undifferentiated cells with the potential, upon appropriate stimulation, to generate cell types representing all three embryonic germ layers <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>. Since the first reported isolation of human cells with these properties <abbrgrp><abbr bid="B2">2</abbr></abbrgrp>, the derivation of more than 150 such lines has been described. This large collection of human ESC lines provides opportunities for understanding the earliest stages of human embryo and tissue development, as well as for elucidating the mechanisms that can permanently maintain pluripotency. Studies of mouse ESCs have defined a number of genes that appear to play key roles in this process, including those encoding Oct4 <abbrgrp><abbr bid="B3">3</abbr></abbrgrp>, Nanog <abbrgrp><abbr bid="B4">4</abbr><abbr bid="B5">5</abbr></abbrgrp>, Sox2 <abbrgrp><abbr bid="B6">6</abbr></abbrgrp>, FoxD3 <abbrgrp><abbr bid="B7">7</abbr></abbrgrp> and fibroblast growth factor-4 <abbrgrp><abbr bid="B8">8</abbr><abbr bid="B9">9</abbr></abbrgrp>. Comparisons of mouse and human ESCs have also revealed a number of conserved signaling pathways, including those involving JAK/STAT, transforming growth factor-&#946; and fibroblast growth factor <abbrgrp><abbr bid="B10">10</abbr><abbr bid="B11">11</abbr><abbr bid="B12">12</abbr></abbrgrp>. 
However, cross-species analysis of microarray data <abbrgrp><abbr bid="B13">13</abbr><abbr bid="B14">14</abbr></abbrgrp> and expressed sequence tag (EST) resources <abbrgrp><abbr bid="B15">15</abbr><abbr bid="B16">16</abbr><abbr bid="B17">17</abbr><abbr bid="B18">18</abbr></abbrgrp> suggest that additional molecular regulators of ESC self-renewal may exist and that likely candidates are heterochronic genes, microRNAs, genes involved in telomeric regulation and polycomb group repressors <abbrgrp><abbr bid="B14">14</abbr></abbrgrp>.</p>
         <p>Microarray-based approaches have been used to define the transcriptomes of numerous human ESC lines, including BG01, BG02, WA01, WA07, WA09, WA13, WA14, TE06, UC01 and UC06 <abbrgrp><abbr bid="B19">19</abbr><abbr bid="B20">20</abbr><abbr bid="B21">21</abbr><abbr bid="B22">22</abbr></abbrgrp>. These studies provide a rich resource for cell line comparisons; however, incomplete annotation of the genome and inherent biases in the microarray technology limit interpretation to well characterized, abundantly expressed transcripts <abbrgrp><abbr bid="B23">23</abbr><abbr bid="B24">24</abbr><abbr bid="B25">25</abbr></abbrgrp>. A number of DNA sequence-based approaches have also been used to study the human ESC transcriptome, including EST analysis <abbrgrp><abbr bid="B17">17</abbr></abbrgrp>, serial analysis of gene expression (SAGE) <abbrgrp><abbr bid="B15">15</abbr></abbrgrp> and massively parallel signature sequencing (MPSS) <abbrgrp><abbr bid="B16">16</abbr><abbr bid="B18">18</abbr></abbrgrp>. Comparisons of these datasets have been used to search for genes that might be required for maintenance of pluripotency <abbrgrp><abbr bid="B13">13</abbr><abbr bid="B15">15</abbr><abbr bid="B16">16</abbr><abbr bid="B22">22</abbr></abbrgrp> but, interestingly, exhibit limited overlap between datasets, in some cases as low as 1% <abbrgrp><abbr bid="B26">26</abbr><abbr bid="B27">27</abbr><abbr bid="B28">28</abbr></abbrgrp>, possibly because of the different technologies employed in different studies <abbrgrp><abbr bid="B23">23</abbr></abbrgrp>. The fact that a large proportion of transcripts expressed in ESCs do not correspond to annotated genes has further confounded the yields of such comparisons <abbrgrp><abbr bid="B14">14</abbr></abbrgrp>. 
To generate a transcript discovery resource complementary to previous work, we undertook a large scale gene expression analysis of nine different human ESC lines, maintained as undifferentiated cells, using the long serial analysis of gene expression (LongSAGE <abbrgrp><abbr bid="B29">29</abbr></abbrgrp>) approach.</p>
      </sec>
      <sec>
         <st>
            <p>Results and discussion</p>
         </st>
         <sec>
            <st>
               <p>Digital gene expression profiling of nine human ESC lines reveals an enrichment of RNA binding proteins</p>
            </st>
            <p>LongSAGE libraries were constructed using total RNA purified from nine different human ESC lines cultured as undifferentiated cells by serial passaging on mouse embryonic fibroblast (MEF) feeder layers <abbrgrp><abbr bid="B30">30</abbr></abbrgrp> (Table <tblr tid="T1">1</tblr>). To enable detection of the majority of the moderately to abundantly expressed transcripts, we sequenced most libraries to a depth of approximately 200,000 tags. However, in one case (the library prepared from WA09 cells), we generated 468,252 tags. To ensure that tags included in the libraries were not contaminated with transcripts expressed from the MEF feeder layers, all tags matching the mouse reference genome sequence were excluded from further analysis (Additional data file 1). SAGE libraries were analyzed individually, and also as an electronically pooled 'meta-library' containing 2.5 million tags representing 379,645 different tag sequences. Of these, 73% were observed only once ('singletons'). Our previous experience indicated that singletons are enriched for experimental artifacts (sequencing errors, reverse transcriptase artifacts, and so on) as well as rare transcripts <abbrgrp><abbr bid="B30">30</abbr></abbrgrp>. To reduce the artifacts, we assigned confidence values to each tag sequence and selected for analysis only high quality tags as described <abbrgrp><abbr bid="B30">30</abbr></abbrgrp>. This filtering reduced the total number of different tag sequences to 268,515 (Additional data file 2). Of these, 40% of the singletons and 87% of the non-singletons could be mapped to publicly available gene expression resources.</p>
            <tbl id="T1">
               <title>
                  <p>Table 1</p>
               </title>
               <caption>
                  <p>Human embryonic stem cell lines profiled in this study</p>
               </caption>
               <tblbdy cols="9">
                  <r>
                     <c ca="left">
                        <p>Provider's code</p>
                     </c>
                     <c ca="left">
                        <p>NIH code</p>
                     </c>
                     <c ca="left">
                        <p>Library identifier</p>
                     </c>
                     <c ca="center">
                        <p>Total no. of tags</p>
                     </c>
                     <c ca="center">
                        <p>Passage</p>
                     </c>
                     <c ca="left">
                        <p>Gender</p>
                     </c>
                     <c ca="left">
                        <p>Feeder line</p>
                     </c>
                     <c ca="left">
                        <p>Growth medium</p>
                     </c>
                     <c ca="center">
                        <p>bFGF-2 concentration (ng/ml)</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="9">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>H7</p>
                     </c>
                     <c ca="left">
                        <p>WA07</p>
                     </c>
                     <c ca="left">
                        <p>SHE13</p>
                     </c>
                     <c ca="center">
                        <p>272,470</p>
                     </c>
                     <c ca="center">
                        <p>22</p>
                     </c>
                     <c ca="left">
                        <p>Female</p>
                     </c>
                     <c ca="left">
                        <p>Mouse embryonic fibroblasts (CF-1)</p>
                     </c>
                     <c ca="left">
                        <p>DMEM:F12</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>H9</p>
                     </c>
                     <c ca="left">
                        <p>WA09</p>
                     </c>
                     <c ca="left">
                        <p>SHES2</p>
                     </c>
                     <c ca="center">
                        <p>468,040</p>
                     </c>
                     <c ca="center">
                        <p>38</p>
                     </c>
                     <c ca="left">
                        <p>Female</p>
                     </c>
                     <c ca="left">
                        <p>Mouse embryonic fibroblasts (CF-1)</p>
                     </c>
                     <c ca="left">
                        <p>DMEM:F12</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>H14</p>
                     </c>
                     <c ca="left">
                        <p>WA14</p>
                     </c>
                     <c ca="left">
                        <p>SHE14</p>
                     </c>
                     <c ca="center">
                        <p>212,211</p>
                     </c>
                     <c ca="center">
                        <p>22</p>
                     </c>
                     <c ca="left">
                        <p>Male</p>
                     </c>
                     <c ca="left">
                        <p>Mouse embryonic fibroblasts (CF-1)</p>
                     </c>
                     <c ca="left">
                        <p>DMEM:F12</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>H13</p>
                     </c>
                     <c ca="left">
                        <p>WA13</p>
                     </c>
                     <c ca="left">
                        <p>SHE15</p>
                     </c>
                     <c ca="center">
                        <p>221,117</p>
                     </c>
                     <c ca="center">
                        <p>22</p>
                     </c>
                     <c ca="left">
                        <p>Male</p>
                     </c>
                     <c ca="left">
                        <p>Mouse embryonic fibroblasts (CF-1)</p>
                     </c>
                     <c ca="left">
                        <p>DMEM:F12</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>HES-3</p>
                     </c>
                     <c ca="left">
                        <p>ES03</p>
                     </c>
                     <c ca="left">
                        <p>SHE10</p>
                     </c>
                     <c ca="center">
                        <p>206,292</p>
                     </c>
                     <c ca="center">
                        <p>16</p>
                     </c>
                     <c ca="left">
                        <p>Female</p>
                     </c>
                     <c ca="left">
                        <p>Mouse embryonic fibroblasts (B-81)</p>
                     </c>
                     <c ca="left">
                        <p>DMEM:F12</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>HES-4</p>
                     </c>
                     <c ca="left">
                        <p>ES04</p>
                     </c>
                     <c ca="left">
                        <p>SHE11</p>
                     </c>
                     <c ca="center">
                        <p>209,245</p>
                     </c>
                     <c ca="center">
                        <p>36</p>
                     </c>
                     <c ca="left">
                        <p>Male</p>
                     </c>
                     <c ca="left">
                        <p>Mouse embryonic fibroblasts (B-81)</p>
                     </c>
                     <c ca="left">
                        <p>DMEM:F12</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>HSF-6</p>
                     </c>
                     <c ca="left">
                        <p>UC06</p>
                     </c>
                     <c ca="left">
                        <p>SHES9</p>
                     </c>
                     <c ca="center">
                        <p>189,714</p>
                     </c>
                     <c ca="center">
                        <p>50</p>
                     </c>
                     <c ca="left">
                        <p>Female</p>
                     </c>
                     <c ca="left">
                        <p>Mouse embryonic fibroblasts (CF-1)</p>
                     </c>
                     <c ca="left">
                        <p>DMEM</p>
                     </c>
                     <c ca="center">
                        <p>10</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>H1</p>
                     </c>
                     <c ca="left">
                        <p>WA01</p>
                     </c>
                     <c ca="left">
                        <p>SHE16</p>
                     </c>
                     <c ca="center">
                        <p>218,214</p>
                     </c>
                     <c ca="center">
                        <p>54</p>
                     </c>
                     <c ca="left">
                        <p>Male</p>
                     </c>
                     <c ca="left">
                        <p>None: matrigel</p>
                     </c>
                     <c ca="left">
                        <p>DMEM:F12*</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>H1</p>
                     </c>
                     <c ca="left">
                        <p>WA01</p>
                     </c>
                     <c ca="left">
                        <p>SHE17</p>
                     </c>
                     <c ca="center">
                        <p>276,302</p>
                     </c>
                     <c ca="center">
                        <p>31</p>
                     </c>
                     <c ca="left">
                        <p>Male</p>
                     </c>
                     <c ca="left">
                        <p>Mouse embryonic fibroblasts (CF-1)</p>
                     </c>
                     <c ca="left">
                        <p>DMEM:F12</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>hESBGN-01</p>
                     </c>
                     <c ca="left">
                        <p>BG01</p>
                     </c>
                     <c ca="left">
                        <p>SHE19</p>
                     </c>
                     <c ca="center">
                        <p>201,699</p>
                     </c>
                     <c ca="center">
                        <p>20</p>
                     </c>
                     <c ca="left">
                        <p>Male</p>
                     </c>
                     <c ca="left">
                        <p>Mouse embryonic fibroblasts</p>
                     </c>
                     <c ca="left">
                        <p>DMEM:F12</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>*Mouse embryonic fibroblast conditioned media. bFGF-2, basic fibroblast growth factor.</p>
               </tblfn>
            </tbl>
            <p>To investigate the similarities and differences between the libraries, we performed hierarchical clustering using Pearson correlation coefficients <abbrgrp><abbr bid="B31">31</abbr></abbrgrp>. For this comparison, we included data from four LongSAGE libraries generated from terminally differentiated cells (available from the Cancer Genome Anatomy Project <abbrgrp><abbr bid="B32">32</abbr></abbrgrp>) to provide an 'out-group'. Figure <figr fid="F1">1</figr> shows that the libraries for all nine human ESC lines form a cluster distinct from the libraries for the four terminally differentiated cell preparations, as expected. The ESC libraries also do not cluster together based on obvious commonalities between the lines, such as the MEF feeder lines used, sex chromosome karyotype or passage number.</p>
            <fig id="F1">
               <title>
                  <p>Figure 1</p>
               </title>
               <caption>
                  <p>Pearson distance tree of human ESC libraries</p>
               </caption>
               <text>
                  <p>Pearson distance tree of human ESC libraries. ESC libraries do not cluster based on the genotype (compare WA01 and WA01-M), MEF feeder line (ES03 and ES04) or passage number (compare WA07 and WA01). Brain sub nig, LSAGE_Brain_normal_substantia_nigra_B_1; Breast epi, LSAGE_Breast_normal_myoepithelium_AP_IDC7; Pancreas, LSAGE_Pancreas_normal_B_1; Vascular endo, LSAGE_Vascular_endothelium_normal_liver_associated_AP_NLEC1.</p>
               </text>
               <graphic file="gb-2007-8-6-r113-1"/>
            </fig>
            <p>To assess the representation of known genes in the nine human ESC transcriptomes, we compared our data to other human sequence tag-based resources <abbrgrp><abbr bid="B15">15</abbr><abbr bid="B16">16</abbr><abbr bid="B17">17</abbr><abbr bid="B18">18</abbr></abbrgrp>. Highly expressed genes in each of the human ESC libraries showed significant overlap with previously published ESC SAGE <abbrgrp><abbr bid="B15">15</abbr></abbrgrp> and MPSS datasets <abbrgrp><abbr bid="B18">18</abbr></abbrgrp>, but the diversity of genes identified by our LongSAGE data was significantly greater (Figure <figr fid="F2">2</figr>). To explore the functions encoded by transcripts detected in the LongSAGE libraries, we divided the genes (identified by uniquely mapping tags) into their respective Gene Ontology (GO) slim categories <abbrgrp><abbr bid="B33">33</abbr></abbrgrp>. Pair-wise comparisons of individual human ESC libraries showed little difference in the relative proportions of each of the GO slim categories (Additional data file 3). In contrast, a similar comparison of individual or pooled ESC libraries to the differentiated cell lines showed a statistically significant increase, in the ESC libraries, in the proportion of transcripts encoding RNA binding proteins and mitochondrial proteins (<it>P </it>= 1.8 &#215; 10<sup>-7 </sup>and 1.0 &#215; 10<sup>-6</sup>, respectively, by one-sided <it>t</it>-tests).</p>
            <fig id="F2">
               <title>
                  <p>Figure 2</p>
               </title>
               <caption>
                  <p>Coverage of the MGC by ESC sequence tag-based transcriptomes</p>
               </caption>
               <text>
                  <p>Coverage of the MGC by ESC sequence tag-based transcriptomes. Unambiguous tags from published MPSS and short SAGE ESC transcriptomes were mapped to genes in the MGC and compared to identically treated LongSAGE transcriptomes. To assess the impact of tag number on gene identification, the proportion of MGC sequences detected was plotted against increasing numbers of tags. Coverage of the MGC increases with increased numbers of tags for ESC LongSAGE libraries even at levels above 200,000 tags. In contrast, coverage of the MGC by the MPSS library plateaus early with little increase in coverage observed with increased sampling depth (MPSS). Coverage of the MGC by the short SAGE ESC libraries (ES03_SAGE and ES04_SAGE) is significantly lower due to the presence of ambiguous tags.</p>
               </text>
               <graphic file="gb-2007-8-6-r113-2"/>
            </fig>
            <p>To investigate the potential functional significance of increased expression of transcripts for RNA binding proteins, we compared the global splicing profile of the ESCs and the four libraries of terminally differentiated cells. This was done by performing pair-wise comparisons across all transcripts in both the ESC and the terminally differentiated cell meta-libraries with the position of each uniquely mapped LongSAGE tag for which a transcript was known. These analyses did not reveal any difference in global transcript splicing patterns between the two meta-libraries, although differences in the relative abundance of specific transcript isoforms were identified. Of a total of 70 transcript isoforms found to be differentially expressed between the ESC and differentiated cell meta-libraries, 8 demonstrated statistical significance (<it>P </it>&lt; 3.0 &#215; 10<sup>-5</sup>; Additional data file 4). The most significantly affected transcript (lowest <it>P </it>value) encoded Secreted frizzled-related protein-1 (Sfrp1), a well-characterized antagonist of WNT signaling. Our analysis suggested that the two isoforms of Sfrp1 we identified either retained or lost the 3' untranslated region (UTR; Figure <figr fid="F3">3</figr>). Only the transcript isoform lacking the 3' UTR was found exclusively in the ESCs. Closer examination of the 3' UTR revealed putative miRNA target sites for two evolutionarily conserved miRNAs <abbrgrp><abbr bid="B34">34</abbr></abbrgrp>, the mouse homologues of which were found previously to be expressed in murine ESCs <abbrgrp><abbr bid="B35">35</abbr></abbrgrp> (Figure <figr fid="F3">3</figr>). Given that activation of the canonical WNT signaling pathway induces differentiation and cell proliferation <abbrgrp><abbr bid="B36">36</abbr></abbrgrp>, we speculate that the expression of Sfrp1 may be regulated through miRNA-directed translational repression and that this regulation is bypassed through alternative 3' end formation in pluripotent ESCs.</p>
            <fig id="F3">
               <title>
                  <p>Figure 3</p>
               </title>
               <caption>
                  <p>Differentially expressed isoforms (as predicted by LongSAGE tag positions) for the <it>Sfrp1 </it>transcript (see text)</p>
               </caption>
               <text>
                  <p>Differentially expressed isoforms (as predicted by LongSAGE tag positions) for the <it>Sfrp1 </it>transcript (see text). The tag sequence at position 9 results in the loss of the 3' UTR region targeted by evolutionarily conserved miRNAs. Putative miRNA target sites were predicted using miRanda [34] and are represented by hashed boxes.</p>
               </text>
               <graphic file="gb-2007-8-6-r113-3"/>
            </fig>
            <p>We next examined the expression of transcripts that encode previously identified markers of undifferentiated ESCs. These include transcription factors such as Oct4 <abbrgrp><abbr bid="B37">37</abbr></abbrgrp> and Nanog <abbrgrp><abbr bid="B4">4</abbr><abbr bid="B5">5</abbr></abbrgrp>, the cell surface proteins tdgf-1 <abbrgrp><abbr bid="B38">38</abbr></abbrgrp> and thy-1 <abbrgrp><abbr bid="B39">39</abbr></abbrgrp>, Lck <abbrgrp><abbr bid="B13">13</abbr></abbrgrp>, connexin cx43 <abbrgrp><abbr bid="B40">40</abbr></abbrgrp>, Rex1 <abbrgrp><abbr bid="B41">41</abbr></abbrgrp>, and Lefty-A and Lefty-B <abbrgrp><abbr bid="B42">42</abbr></abbrgrp>. In addition, we looked for transcripts from six genes associated with early stages of ESC differentiation <abbrgrp><abbr bid="B14">14</abbr></abbrgrp>. Table <tblr tid="T2">2</tblr> shows the normalized gene expression levels across all cell lines. A similar pattern of expression was observed across all lines, with the exception of HSF-6, which exhibited a decrease in expression of ESC marker genes and a concomitant increase in expression of genes associated with differentiation, including alpha-fetoprotein. Notably, expression of Nanog, a divergent homeodomain protein that directs propagation of undifferentiated mouse ESCs <abbrgrp><abbr bid="B5">5</abbr></abbrgrp>, was not detected in the HSF-6 library. These features are consistent with the closer relationship of the HSF-6 library to libraries from differentiated tissues than to other ESC libraries (Figure <figr fid="F1">1</figr>). We therefore excluded the HSF-6 library from further analysis.</p>
            <tbl id="T2">
               <title>
                  <p>Table 2</p>
               </title>
               <caption>
                  <p>Expression of undifferentiated and differentiated ESC markers</p>
               </caption>
               <tblbdy cols="14">
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c cspan="3" ca="center">
                        <p>Meta-libraries</p>
                     </c>
                     <c cspan="10" ca="center">
                        <p>Embryonic stem cell libraries</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c cspan="3">
                        <hr/>
                     </c>
                     <c cspan="10">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Markers</p>
                     </c>
                     <c ca="center">
                        <p>CG-Meta</p>
                     </c>
                     <c ca="center">
                        <p>CGN-Meta</p>
                     </c>
                     <c ca="center">
                        <p>ESC-Meta</p>
                     </c>
                     <c ca="center">
                        <p>WA01</p>
                     </c>
                     <c ca="center">
                        <p>WA01-M</p>
                     </c>
                     <c ca="center">
                        <p>WA07</p>
                     </c>
                     <c ca="center">
                        <p>WA09</p>
                     </c>
                     <c ca="center">
                        <p>WA13</p>
                     </c>
                     <c ca="center">
                        <p>WA14</p>
                     </c>
                     <c ca="center">
                        <p>HSF-6</p>
                     </c>
                     <c ca="center">
                        <p>ES03</p>
                     </c>
                     <c ca="center">
                        <p>ES04</p>
                     </c>
                     <c ca="center">
                        <p>BG01</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="14">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Undiff</b>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>cx43</p>
                     </c>
                     <c ca="center">
                        <p>390.379</p>
                     </c>
                     <c ca="center">
                        <p>799.779</p>
                     </c>
                     <c ca="center">
                        <p>1635.9</p>
                     </c>
                     <c ca="center">
                        <p>1806.3</p>
                     </c>
                     <c ca="center">
                        <p>1182.32</p>
                     </c>
                     <c ca="center">
                        <p>1501.08</p>
                     </c>
                     <c ca="center">
                        <p>1155.02</p>
                     </c>
                     <c ca="center">
                        <p>1791.03</p>
                     </c>
                     <c ca="center">
                        <p>1720.1</p>
                     </c>
                     <c ca="center">
                        <p>970.938</p>
                     </c>
                     <c ca="center">
                        <p>2127.51</p>
                     </c>
                     <c ca="center">
                        <p>1486.37</p>
                     </c>
                     <c ca="center">
                        <p>2538.6</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Oct4</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>1093.07</p>
                     </c>
                     <c ca="center">
                        <p>1433.46</p>
                     </c>
                     <c ca="center">
                        <p>1397.71</p>
                     </c>
                     <c ca="center">
                        <p>634.932</p>
                     </c>
                     <c ca="center">
                        <p>883.381</p>
                     </c>
                     <c ca="center">
                        <p>972.402</p>
                     </c>
                     <c ca="center">
                        <p>1376.08</p>
                     </c>
                     <c ca="center">
                        <p>432.023</p>
                     </c>
                     <c ca="center">
                        <p>1280.41</p>
                     </c>
                     <c ca="center">
                        <p>1247.4</p>
                     </c>
                     <c ca="center">
                        <p>1665.95</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Tdgf1</p>
                     </c>
                     <c ca="center">
                        <p>13.9733</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>665.447</p>
                     </c>
                     <c ca="center">
                        <p>716.729</p>
                     </c>
                     <c ca="center">
                        <p>1131.92</p>
                     </c>
                     <c ca="center">
                        <p>767.057</p>
                     </c>
                     <c ca="center">
                        <p>252.394</p>
                     </c>
                     <c ca="center">
                        <p>339.21</p>
                     </c>
                     <c ca="center">
                        <p>801.146</p>
                     </c>
                     <c ca="center">
                        <p>329.585</p>
                     </c>
                     <c ca="center">
                        <p>374.871</p>
                     </c>
                     <c ca="center">
                        <p>578.3</p>
                     </c>
                     <c ca="center">
                        <p>1199.88</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Sox2</p>
                     </c>
                     <c ca="center">
                        <p>43.6666</p>
                     </c>
                     <c ca="center">
                        <p>42.8454</p>
                     </c>
                     <c ca="center">
                        <p>406.121</p>
                     </c>
                     <c ca="center">
                        <p>398.183</p>
                     </c>
                     <c ca="center">
                        <p>265.793</p>
                     </c>
                     <c ca="center">
                        <p>352.332</p>
                     </c>
                     <c ca="center">
                        <p>675.905</p>
                     </c>
                     <c ca="center">
                        <p>257.8</p>
                     </c>
                     <c ca="center">
                        <p>518.389</p>
                     </c>
                     <c ca="center">
                        <p>320.677</p>
                     </c>
                     <c ca="center">
                        <p>350.528</p>
                     </c>
                     <c ca="center">
                        <p>358.451</p>
                     </c>
                     <c ca="center">
                        <p>416.489</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Dppa4</p>
                     </c>
                     <c ca="center">
                        <p>11.3533</p>
                     </c>
                     <c ca="center">
                        <p>4.76059</p>
                     </c>
                     <c ca="center">
                        <p>386.637</p>
                     </c>
                     <c ca="center">
                        <p>463.34</p>
                     </c>
                     <c ca="center">
                        <p>595.745</p>
                     </c>
                     <c ca="center">
                        <p>572.54</p>
                     </c>
                     <c ca="center">
                        <p>290.895</p>
                     </c>
                     <c ca="center">
                        <p>303.028</p>
                     </c>
                     <c ca="center">
                        <p>494.826</p>
                     </c>
                     <c ca="center">
                        <p>231.6</p>
                     </c>
                     <c ca="center">
                        <p>189.87</p>
                     </c>
                     <c ca="center">
                        <p>430.141</p>
                     </c>
                     <c ca="center">
                        <p>421.447</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Lefty-b</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>14.2818</p>
                     </c>
                     <c ca="center">
                        <p>245.218</p>
                     </c>
                     <c ca="center">
                        <p>173.753</p>
                     </c>
                     <c ca="center">
                        <p>9.16532</p>
                     </c>
                     <c ca="center">
                        <p>77.0727</p>
                     </c>
                     <c ca="center">
                        <p>32.0841</p>
                     </c>
                     <c ca="center">
                        <p>90.456</p>
                     </c>
                     <c ca="center">
                        <p>348.734</p>
                     </c>
                     <c ca="center">
                        <p>102.438</p>
                     </c>
                     <c ca="center">
                        <p>73.0268</p>
                     </c>
                     <c ca="center">
                        <p>258.084</p>
                     </c>
                     <c ca="center">
                        <p>233.036</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Rex-1</p>
                     </c>
                     <c ca="center">
                        <p>38.4266</p>
                     </c>
                     <c ca="center">
                        <p>14.2818</p>
                     </c>
                     <c ca="center">
                        <p>105.813</p>
                     </c>
                     <c ca="center">
                        <p>112.215</p>
                     </c>
                     <c ca="center">
                        <p>82.4879</p>
                     </c>
                     <c ca="center">
                        <p>80.7428</p>
                     </c>
                     <c ca="center">
                        <p>132.614</p>
                     </c>
                     <c ca="center">
                        <p>31.6596</p>
                     </c>
                     <c ca="center">
                        <p>98.965</p>
                     </c>
                     <c ca="center">
                        <p>40.0846</p>
                     </c>
                     <c ca="center">
                        <p>160.659</p>
                     </c>
                     <c ca="center">
                        <p>62.1314</p>
                     </c>
                     <c ca="center">
                        <p>158.662</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Lefty-a</p>
                     </c>
                     <c ca="center">
                        <p>0.873332</p>
                     </c>
                     <c ca="center">
                        <p>4.76059</p>
                     </c>
                     <c ca="center">
                        <p>102.454</p>
                     </c>
                     <c ca="center">
                        <p>54.2976</p>
                     </c>
                     <c ca="center">
                        <p>9.16532</p>
                     </c>
                     <c ca="center">
                        <p>25.6909</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>31.6596</p>
                     </c>
                     <c ca="center">
                        <p>70.6894</p>
                     </c>
                     <c ca="center">
                        <p>22.2692</p>
                     </c>
                     <c ca="center">
                        <p>24.3423</p>
                     </c>
                     <c ca="center">
                        <p>76.4694</p>
                     </c>
                     <c ca="center">
                        <p>168.579</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Nanog</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>89.6892</p>
                     </c>
                     <c ca="center">
                        <p>65.1572</p>
                     </c>
                     <c ca="center">
                        <p>77.9051</p>
                     </c>
                     <c ca="center">
                        <p>110.104</p>
                     </c>
                     <c ca="center">
                        <p>66.3071</p>
                     </c>
                     <c ca="center">
                        <p>135.684</p>
                     </c>
                     <c ca="center">
                        <p>70.6894</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>92.5006</p>
                     </c>
                     <c ca="center">
                        <p>195.953</p>
                     </c>
                     <c ca="center">
                        <p>44.6238</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Nodal</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>47.6999</p>
                     </c>
                     <c ca="center">
                        <p>21.719</p>
                     </c>
                     <c ca="center">
                        <p>4.58266</p>
                     </c>
                     <c ca="center">
                        <p>40.3714</p>
                     </c>
                     <c ca="center">
                        <p>6.41681</p>
                     </c>
                     <c ca="center">
                        <p>58.7964</p>
                     </c>
                     <c ca="center">
                        <p>84.8272</p>
                     </c>
                     <c ca="center">
                        <p>80.1692</p>
                     </c>
                     <c ca="center">
                        <p>48.6846</p>
                     </c>
                     <c ca="center">
                        <p>52.5727</p>
                     </c>
                     <c ca="center">
                        <p>64.4566</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Foxd3</p>
                     </c>
                     <c ca="center">
                        <p>1.74666</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>23.1781</p>
                     </c>
                     <c ca="center">
                        <p>28.9587</p>
                     </c>
                     <c ca="center">
                        <p>45.8266</p>
                     </c>
                     <c ca="center">
                        <p>11.0104</p>
                     </c>
                     <c ca="center">
                        <p>32.0841</p>
                     </c>
                     <c ca="center">
                        <p>13.5684</p>
                     </c>
                     <c ca="center">
                        <p>9.42524</p>
                     </c>
                     <c ca="center">
                        <p>4.45385</p>
                     </c>
                     <c ca="center">
                        <p>24.3422</p>
                     </c>
                     <c ca="center">
                        <p>19.1174</p>
                     </c>
                     <c ca="center">
                        <p>49.582</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Dppa2</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>14.7803</p>
                     </c>
                     <c ca="center">
                        <p>18.0992</p>
                     </c>
                     <c ca="center">
                        <p>36.6613</p>
                     </c>
                     <c ca="center">
                        <p>14.6805</p>
                     </c>
                     <c ca="center">
                        <p>4.27787</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>9.42525</p>
                     </c>
                     <c ca="center">
                        <p>4.45385</p>
                     </c>
                     <c ca="center">
                        <p>4.86845</p>
                     </c>
                     <c ca="center">
                        <p>14.338</p>
                     </c>
                     <c ca="center">
                        <p>69.4148</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Lck</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>13.1007</p>
                     </c>
                     <c ca="center">
                        <p>14.4794</p>
                     </c>
                     <c ca="center">
                        <p>13.748</p>
                     </c>
                     <c ca="center">
                        <p>18.3506</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>22.614</p>
                     </c>
                     <c ca="center">
                        <p>23.5631</p>
                     </c>
                     <c ca="center">
                        <p>4.45385</p>
                     </c>
                     <c ca="center">
                        <p>4.86845</p>
                     </c>
                     <c ca="center">
                        <p>23.8967</p>
                     </c>
                     <c ca="center">
                        <p>14.8746</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>utf-1</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>11.0852</p>
                     </c>
                     <c ca="center">
                        <p>10.8595</p>
                     </c>
                     <c ca="center">
                        <p>18.3306</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>10.6947</p>
                     </c>
                     <c ca="center">
                        <p>13.5684</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>17.8154</p>
                     </c>
                     <c ca="center">
                        <p>14.6054</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>34.7074</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Tert-1</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>6.7183</p>
                     </c>
                     <c ca="center">
                        <p>10.8595</p>
                     </c>
                     <c ca="center">
                        <p>13.748</p>
                     </c>
                     <c ca="center">
                        <p>7.34026</p>
                     </c>
                     <c ca="center">
                        <p>10.6947</p>
                     </c>
                     <c ca="center">
                        <p>9.0456</p>
                     </c>
                     <c ca="center">
                        <p>4.71262</p>
                     </c>
                     <c ca="center">
                        <p>4.45385</p>
                     </c>
                     <c ca="center">
                        <p>4.86845</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>abcg2</p>
                     </c>
                     <c ca="center">
                        <p>0.873332</p>
                     </c>
                     <c ca="center">
                        <p>14.2818</p>
                     </c>
                     <c ca="center">
                        <p>2.01549</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>4.58266</p>
                     </c>
                     <c ca="center">
                        <p>3.67013</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>4.45385</p>
                     </c>
                     <c ca="center">
                        <p>4.86845</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>4.9582</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>dppa3</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>1.34366</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>4.58266</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>2.13894</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>4.45385</p>
                     </c>
                     <c ca="center">
                        <p>4.86845</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>4.9582</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>cx45</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0.67183</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>4.58266</p>
                     </c>
                     <c ca="center">
                        <p>3.67013</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>Diff</b>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>brachyury</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>3.35915</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>40.7052</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>4.45385</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>afp</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>8.06196</p>
                     </c>
                     <c ca="center">
                        <p>3.61984</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>8.55575</p>
                     </c>
                     <c ca="center">
                        <p>49.7508</p>
                     </c>
                     <c ca="center">
                        <p>4.71262</p>
                     </c>
                     <c ca="center">
                        <p>334.038</p>
                     </c>
                     <c ca="center">
                        <p>9.7369</p>
                     </c>
                     <c ca="center">
                        <p>4.77934</p>
                     </c>
                     <c ca="center">
                        <p>4.9582</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>krt15</p>
                     </c>
                     <c ca="center">
                        <p>52.3999</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0.335915</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>4.58266</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>sox-1</p>
                     </c>
                     <c ca="center">
                        <p>8.73332</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0.335915</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>8.90769</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>fgf5-1</p>
                     </c>
                     <c ca="center">
                        <p>48.0332</p>
                     </c>
                     <c ca="center">
                        <p>14.2818</p>
                     </c>
                     <c ca="center">
                        <p>22.1704</p>
                     </c>
                     <c ca="center">
                        <p>21.719</p>
                     </c>
                     <c ca="center">
                        <p>27.496</p>
                     </c>
                     <c ca="center">
                        <p>11.0104</p>
                     </c>
                     <c ca="center">
                        <p>10.6947</p>
                     </c>
                     <c ca="center">
                        <p>13.5684</p>
                     </c>
                     <c ca="center">
                        <p>18.8505</p>
                     </c>
                     <c ca="center">
                        <p>17.8154</p>
                     </c>
                     <c ca="center">
                        <p>19.4738</p>
                     </c>
                     <c ca="center">
                        <p>28.676</p>
                     </c>
                     <c ca="center">
                        <p>19.8328</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>Expression of defined ESC markers normalized to tags per million. Data for Meta ESCs (Meta-ESC), malignant (Meta-CG) and normal differentiated (Meta-CGN) cells are included for comparison. Diff, differentiated; undiff, undifferentiated.</p>
               </tblfn>
            </tbl>
            <p>A previous analysis of SAGE data generated using ES03 and ES04 cells showed that Rex1 was within the top 25 differentially expressed transcripts, with no Rex1 tags detected in the ES04 line and an absence of Rex1 expression in ES04 cells confirmed by quantitative and semi-quantitative real time (RT)-PCR <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>. Interestingly, in our LongSAGE libraries, tags for Rex1 were present in all nine ESC libraries, including the library prepared from ES04 cells and there was less than a three-fold difference in Rex1 expression between ES03 and ES04 (Table <tblr tid="T2">2</tblr>).</p>
            <p>To generate a list of transcripts common to all libraries (excluding the HSF-6 library because of the differentiation markers found therein), we first identified tags from each library that uniquely mapped to transcripts within RefSeq <abbrgrp><abbr bid="B43">43</abbr></abbrgrp> and the Mammalian Gene Collection (MGC) <abbrgrp><abbr bid="B44">44</abbr></abbrgrp>. This analysis identified a set of 4,337 LongSAGE tags present in all libraries (Additional data file 5). Comparison of this list to those generated by previous MPSS and SAGE approaches revealed extensive (80%) concordance between the SAGE-based transcriptomes. In contrast, 52% of genes identified by MPSS were not found in either of the SAGE common gene lists. Some of this lack of concordance may be explained by differences in the tagging restriction enzyme used by the two protocols (<it>Nla</it>III for SAGE and <it>Dpn</it>1 for MPSS) and the fact that different mRNA preparations were used in each study. To further explore this lack of concordance, we compared the LongSAGE and MPSS-derived gene lists to a common gene list derived from Affymetrix expression arrays generated from the same RNAs used to construct our LongSAGE libraries <abbrgrp><abbr bid="B45">45</abbr></abbrgrp>. The Affymetrix common gene set contained more than 80% of the LongSAGE common gene list (Additional data file 5) while MPSS contained only 68% of the genes on this list.</p>
         </sec>
         <sec>
            <st>
               <p>Identification of novel ESC-specific transcripts</p>
            </st>
            <p>LongSAGE offers opportunities for discovering novel transcripts. These can be identified as tags that map uniquely to the genome but not to any available transcript resources. To look for these, we used the 2.5 million tag meta-library, which contained 379,645 unique tag sequences. Grouping LongSAGE tags that mapped to genomic locations in close proximity to one another <abbrgrp><abbr bid="B30">30</abbr></abbrgrp> resulted in the identification of 24,593 transcription units. Of these, 14,588 did not overlap with known genes and were classified as novel. Most tags were expressed at low levels with 46% (6,672) identified by a single LongSAGE tag. Even though singletons are enriched for artifacts, many of these are likely to represent real transcripts, for two reasons: first, they map to the genome; and second, we <abbrgrp><abbr bid="B30">30</abbr></abbrgrp> and others <abbrgrp><abbr bid="B46">46</abbr></abbrgrp> have shown previously that at least 70% of novel, singleton, high quality LongSAGE tags identify rare transcripts whose expression can be confirmed in RNA-dependent RT-PCR experiments.</p>
            <p>To further characterize these putative novel, low-abundance ESC library specific transcripts, we compared the ESC meta-library to publicly available data derived from 247 non-ESC SAGE libraries that together contained 654,491 unique tag sequences. This comparison identified 20,047 tag sequences found only in the human ESC meta-library (Additional data file 6). For subsequent analyses, we focused on those tags that uniquely mapped at least 2 kb away from any known gene. This analysis reduced the number of tags to 634 (Additional data file 7), of which 301 were found within genomic regions exhibiting sequence conservation between human and mouse or rat (Additional data file 8). We used rapid amplification of cDNA ends (RACE) <abbrgrp><abbr bid="B47">47</abbr><abbr bid="B48">48</abbr></abbrgrp> to clone the 5' ends of 52 of these (Additional data file 9). Alignment of the resulting sequences to the human genome revealed that 22 (40%) were spliced. An open reading frame (ORF) scan of the 52 RACE clone sequences using Bioperl <abbrgrp><abbr bid="B49">49</abbr></abbrgrp> tools and custom scripts identified 6 transcripts that encoded peptides longer than 100 amino acids in length. However, with the exception of one transcript (HA_003333) that overlapped the 3' end of the <it>MAPK2 </it>gene, none of the identified ORFs demonstrated Ka/Ks ratios suggestive of purifying selection <abbrgrp><abbr bid="B50">50</abbr></abbrgrp>. Hence, these transcripts may not encode proteins but may instead represent non-coding RNAs (ncRNAs).</p>
            <p>Four RACE clones were found to have genomic coordinates that overlapped with those of known transcripts (Additional data file 9). One of these (HA_003240; Figure <figr fid="F4">4</figr>) is of particular interest because it contains the entire coding sequence of the <it>Foxb1 </it>gene within its first intron. <it>Foxb1 </it>encodes a winged helix transcription factor involved in the development of the vertebrate central nervous system and <it>Foxb1</it><sup>-/- </sup>mice display phenotypes consistent with a requirement for this gene in both embryonic and postnatal stages of development <abbrgrp><abbr bid="B51">51</abbr><abbr bid="B52">52</abbr><abbr bid="B53">53</abbr></abbrgrp>. Interestingly, the ESC meta-library did not contain any tags corresponding to known <it>Foxb1 </it>transcripts except for a single <it>Foxb1 </it>tag in the HSF-6 library. This general lack of <it>Foxb1 </it>expression in ESCs and the genomic location of the <it>Foxb1 </it>gene within the first intron of HA_003240 are consistent with the notion that <it>Foxb1 </it>expression is repressed by expression of HA_003240, possibly by steric inhibition of the transcription initiation complex <abbrgrp><abbr bid="B54">54</abbr></abbrgrp>. The HA_003240 sequence overlaps partially with an EST obtained from an undifferentiated human ESC line (CD049816), as well as with ESTs from an embryonic carcinoma line, a kidney carcinoma line and hypothalamus tissue (for example, DA713666, DB173211 and BI458015, respectively). Examination of the promoter region of HA_003240 revealed the presence of highly conserved sequences containing an Oct/Sox binding element, suggesting that HA_003240 expression may be maintained in pluripotent ESCs through the recruitment of an Oct4/Sox2 complex (Figure <figr fid="F4">4</figr>). 
<it>Oct4 </it>encodes a transcription factor that regulates a number of key human ESC markers, including Nanog, through co-operative binding with a Sox family member <abbrgrp><abbr bid="B55">55</abbr></abbrgrp>. Given the documented role for Foxb1 in controlling the differentiation of neuronal cell types, the genomic organization of the <it>Foxb1 </it>locus is intriguing and suggests an interesting mechanism for negatively regulating <it>Foxb1 </it>expression in Oct4-expressing cells.</p>
            <fig id="F4">
               <title>
                  <p>Figure 4</p>
               </title>
               <caption>
                  <p>Structure of the HA_003240 transcript</p>
               </caption>
               <text>
                  <p>Structure of the HA_003240 transcript. Alignment of the 5' RACE sequence for HA_003240 to chromosome 15 sequences, showing its position relative to the nested single exon transcript <it>Foxb1 </it>and conservation of the Octamer/Sox binding elements within the promoter region.</p>
               </text>
               <graphic file="gb-2007-8-6-r113-4"/>
            </fig>
            <p>Many pseudogenes have been identified in the human genome using homology-based approaches <abbrgrp><abbr bid="B56">56</abbr><abbr bid="B57">57</abbr><abbr bid="B58">58</abbr></abbrgrp>. Pseudogenes are generally not transcribed due to their lack of functional promoters <abbrgrp><abbr bid="B59">59</abbr><abbr bid="B60">60</abbr></abbrgrp>. However, there are examples of pseudogenes that have retained or acquired functional promoters, leading to their transcription <abbrgrp><abbr bid="B61">61</abbr></abbrgrp>. Because of the low levels of expression of the 52 novel transcripts (on average, only 3 tags per million) we asked whether the 5' RACE clones were derived from expressed pseudogenes. Comparison of the RACE clone sequences to three computationally generated lists of known human pseudogenes <abbrgrp><abbr bid="B56">56</abbr><abbr bid="B57">57</abbr><abbr bid="B58">58</abbr></abbrgrp> revealed only one clone (HA_003350) with a predicted pseudogene contained within its exon. Furthermore, with the exception of HA_003333, none of the novel transcript sequences showed significant sequence similarity to any known ORF (using a 70% ORF threshold <abbrgrp><abbr bid="B58">58</abbr></abbrgrp>). Taken together, these analyses do not support the notion that the novel genes identified by our analysis are enriched for expressed pseudogenes.</p>
            <p>To more fully characterize a transcript identified by a singleton tag (Additional data file 9), we attempted to recover a full length transcript using 5' and 3' RACE and primers annealing within the terminal exon of the putative transcript. Alignment of the resulting candidate full length sequence to the human genome revealed a transcript that contained two introns (Figure <figr fid="F5">5</figr>). Examination of the genomic region surrounding this transcript showed that it resides in a region of the long arm of chromosome 3 (chr3:110,539,351-110,584,565) lacking annotated transcripts. The putative transcriptional start is located 266 bp from the transcriptional start site of <it>Dppa4</it>, a gene known to have an expression pattern in ESCs that is similar to that of <it>Oct4 </it><abbrgrp><abbr bid="B62">62</abbr></abbrgrp> (Figure <figr fid="F5">5</figr>). To investigate the possibility that this promoter region is regulated directly by Oct4, we looked for the presence of conserved Octamer and Sox (high mobility group (HMG)) elements. A single 20 bp region of cross-species sequence conservation was found that contains a consensus binding element for an Octamer/Sox dimer, suggesting that the novel gene is regulated by Oct4/Sox2 (Figure <figr fid="F5">5</figr>; chr3: 110,539,180-110,539,200). In support of this finding, the conserved region was found to reside within a probe identified by chromatin immunoprecipitation (ChIP)/CHIP <abbrgrp><abbr bid="B63">63</abbr></abbrgrp> as a target of Oct4 and Sox2 (Probe spans chr3: 110,539,028-110,539,588). Taken together, these analyses suggest that both <it>Dppa4 </it>and the novel transcript are divergently transcribed from a common promoter bound by an Oct4/Sox complex. Based on its proximity to the <it>Dppa4 </it>gene we have named this novel transcript <it>Spd4 </it>(for 'shares promoter with <it>Dppa4</it>').</p>
            <fig id="F5">
               <title>
                  <p>Figure 5</p>
               </title>
               <caption>
                  <p>Structure of the <it>Spd4 </it>transcript</p>
               </caption>
               <text>
                  <p>Structure of the <it>Spd4 </it>transcript. Alignment of the full-length <it>Spd4 </it>transcript on chromosome 3 showing its position relative to <it>Dppa4 </it>and conservation of the Octamer/Sox binding elements within the promoter region.</p>
               </text>
               <graphic file="gb-2007-8-6-r113-5"/>
            </fig>
            <p>Comparison of the 5' RACE clone sequences to publicly available ESTs revealed 36 (69%) with matches to other ESTs, of which 7 were found only in data derived from pluripotent human ESC lines. One RACE clone that overlapped an EST derived from pluripotent human ESC lines (HA_003152) was also found to be expressed in all nine ESC lines studied here. BLAT <abbrgrp><abbr bid="B64">64</abbr></abbrgrp> alignment of the 5' RACE clone sequence to the human reference genome sequence revealed that HA_003152 contained two introns and resided within a genomic region that exhibited sequence similarity to long interspersed nuclear elements. An ORF scan revealed a 129 amino acid peptide encoded in the second exon with homology to the carboxyl terminus of the LINE <it>p40 </it>ORF.</p>
            <p>To explore the expression pattern of the HA_003152 transcript we used quantitative RT-PCR (qPCR) to compare transcript levels in RNA purified from human ESCs maintained under conditions that promote their maintenance in an undifferentiated state to RNA extracts obtained from human ESCs that had been stimulated to differentiate into embryoid bodies. To provide a comparative dataset we selected five additional novel transcripts for qPCR. In all cases, qPCR amplicons were designed to cross exon-exon boundaries. As controls we also monitored expression of <it>Oct4</it>, <it>Lin28 </it>and <it>Msx1 </it>in the same RNA preparations. Figure <figr fid="F6">6</figr> shows the expected expression pattern for the control gene set, with a reduction in expression of <it>Oct4 </it>and <it>Lin28 </it>in the human ESCs stimulated to differentiate into embryoid bodies and an up-regulation of expression of the early differentiation marker <it>Msx1</it>. Significant reduction of expression was observed in four of the six transcripts tested, including HA_003152, whose expression was undetectable at d30 (Figure <figr fid="F6">6</figr>). These transcripts are hence potential markers of pluripotency.</p>
            <fig id="F6">
               <title>
                  <p>Figure 6</p>
               </title>
               <caption>
                  <p>Expression of selected transcripts during embryoid body differentiation</p>
               </caption>
               <text>
                  <p>Expression of selected transcripts during embryoid body differentiation. qPCR was used to monitor expression of selected transcripts in ESCs stimulated to differentiate into embryoid bodies. Three control markers, Oct4, Lin28 and Msx1, were included. Expression levels are reported as the mean of triplicate measurements and are normalized to GAPDH.</p>
               </text>
               <graphic file="gb-2007-8-6-r113-6"/>
            </fig>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Conclusion</p>
         </st>
         <p>As part of the ongoing effort to elucidate mechanisms regulating ESC self-renewal, we generated 2.5 million LongSAGE tags from nine human ESC lines. Comparison of these data to libraries prepared from differentiated tissues identified a group of ESC-library specific transcripts and an enrichment of transcripts encoding mitochondrial and RNA binding proteins (by comparison to differentiated cells). RNA binding proteins play a role in the regulation of mRNA processing and examination of non-canonical LongSAGE tags in the human ESC libraries suggests that these cells express a distinct collection of gene isoforms. One such isoform may bypass translational down regulation through the expression of a transcript lacking predicted miRNA target sequences.</p>
         <p>An emerging theme in digital gene expression profiling is the identification of a large class of transcripts that map uniquely to the genome, but cannot be localized to any known or computationally predicted transcripts. Tags in this class are predominantly found at relatively low levels. Analysis of the 2.5 million LongSAGE tags generated in the course of this study revealed 14,588 such tag sequences, a subset of which were found exclusively in human ESCs. As a first step towards understanding the relevance of these transcripts to ESC biology we generated 5' RACE clones for 52 novel apparently ESC-specific transcripts. Analyses of these transcripts revealed that the majority do not appear to encode proteins and do not overlap existing pseudogene predictions. One transcript was found to be expressed across all nine ESC lines we profiled and matched ESTs generated by others from ESCs. Its restricted expression pattern suggests that it may represent a novel transcriptional marker for the maintenance of pluripotentiality. In addition to the discovery of this potential marker, we also identified four novel transcripts that may participate in the regulation of expression of known genes, one of which is known to play a direct role in differentiation. Our analyses indicate that there are many previously undiscovered transcripts expressed in human ESCs and support the contention that sampling of SAGE libraries to depths beyond currently accepted practice is required to fully explore the coding potential of the mammalian transcriptome. To assess possible functions associated with such rare transcripts, we are actively pursuing the cloning and characterization of the remaining novel human ESC-specific transcripts identified in this study.</p>
      </sec>
      <sec>
         <st>
            <p>Materials and methods</p>
         </st>
         <sec>
            <st>
               <p>Cell culture and RNA isolation</p>
            </st>
            <p>Detailed information regarding the human ESC lines used in this study can be found at the NIH Stem Cell Information website <abbrgrp><abbr bid="B65">65</abbr></abbrgrp>. The passage numbers of the cells analyzed in this study are presented in Table <tblr tid="T1">1</tblr>. Total RNA was prepared using Trizol reagent (Invitrogen, Burlington, ON, USA) following the manufacturer's protocol and was assayed for quality and quantified using an Agilent 2100 Bioanalyzer (Agilent Technologies) and RNA 6000 Nano LabChip kit (Caliper Technologies, Hopkinton, MA, USA).</p>
         </sec>
         <sec>
            <st>
               <p>LongSAGE library construction</p>
            </st>
            <p>Nine LongSAGE <abbrgrp><abbr bid="B29">29</abbr></abbrgrp> libraries were constructed from 5-20 &#956;g of DNase I-treated total RNA as described <abbrgrp><abbr bid="B30">30</abbr></abbrgrp> (DNase I from Invitrogen). LongSAGE data generated for this study are available through our embryonic stem cell transcriptomes website <abbrgrp><abbr bid="B45">45</abbr></abbrgrp> and through the CGAP web portal <abbrgrp><abbr bid="B32">32</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Novel transcript identification</p>
            </st>
            <p>LongSAGE tags of at least 99.9% accuracy (calculated using Phred <abbrgrp><abbr bid="B66">66</abbr><abbr bid="B67">67</abbr></abbrgrp> quality scores) from the meta-library were compared to 247 publicly available human SAGE libraries (GEO <abbrgrp><abbr bid="B68">68</abbr></abbrgrp>, Discovery db <abbrgrp><abbr bid="B69">69</abbr></abbrgrp>). To allow direct comparison of the LongSAGE data to the 14 bp SAGE tags available in the public libraries, the 3' ends of the 21 bp tags were truncated <it>in silico </it>to form 14 bp tags. A total of 2,508,608 tags corresponding to 222,337 unique 14 bp tag sequences (379,465 parental 21 bp sequences) were utilized in this analysis. These tags were directly compared to all unique tags from the human SAGE libraries to generate a list of tags found solely in the ESC meta-library.</p>
            <p>Tag-to-gene mapping was performed using the comprehensive mapping of SAGE tags (CMOST) software <abbrgrp><abbr bid="B69">69</abbr></abbrgrp> as follows. Tags were mapped to various publicly available transcript databases in a hierarchical fashion with the highest quality transcript databases used first. As tags were mapped to a known transcript in a higher quality database, they were excluded from further analysis with subsequent lower quality databases to mitigate redundancies arising from lower quality DNA sequence resources. The following databases were used for CMOST tag-to-gene mapping in this order: MGC <abbrgrp><abbr bid="B70">70</abbr></abbrgrp>, RefSeq <abbrgrp><abbr bid="B71">71</abbr></abbrgrp>, Ensembl transcripts <abbrgrp><abbr bid="B72">72</abbr></abbrgrp> (exon sequences only), Genbank Human Mitochondrial Sequence (accession AY289102.1), Genbank Non-coding sequences <abbrgrp><abbr bid="B73">73</abbr></abbrgrp>, Ensembl genes <abbrgrp><abbr bid="B72">72</abbr></abbrgrp> (1,000 bp UTR and intron sequences included), Ensembl ESTs <abbrgrp><abbr bid="B72">72</abbr></abbrgrp>, and Golden path genomic contigs (Genbank Human Genome Assembly Contigs build 34, January 2004 <abbrgrp><abbr bid="B73">73</abbr></abbrgrp>). In addition to allowing perfect matches, the CMOST approach attempts to account for single base permutations, insertions and deletions, improving the rate of tag-to-gene mapping.</p>
         </sec>
         <sec>
            <st>
               <p>SAGE tag-to-gene mapping</p>
            </st>
            <p>LongSAGE tags were mapped to known and computationally predicted transcripts using versions of the following databases available as of March, 2005: RefSeq <abbrgrp><abbr bid="B71">71</abbr></abbrgrp>, RefSeqX <abbrgrp><abbr bid="B71">71</abbr></abbrgrp>, Mammalian Gene Collection <abbrgrp><abbr bid="B70">70</abbr></abbrgrp>, and RefSeqGS <abbrgrp><abbr bid="B71">71</abbr></abbrgrp>. Tags were also mapped to human genomic sequence using the NCBI Reference Sequence Genome database <abbrgrp><abbr bid="B71">71</abbr></abbrgrp>, release 35, August 2004. From the genome sequence, a table was generated containing all 27.4 million potential SAGE tags adjacent to genomic <it>Nla</it>III restriction sites (CATG). Of these, our analysis defined a subset of 19.4 million genomic tag sequences that were unique within the genome.</p>
            <p>A second table was generated that stored information about exons: genome sequence contig, transcript orientation, exon number, exon boundary type and nucleotide positions of exon boundaries for all approximately 267,000 exons annotated on release 35 of the Reference Sequence genome. The LongSAGE tag sequences were compared to the unique genomic tag table, yielding sets of genomic positions for all tags in the library. These in turn were compared to the table of exon information, producing a mapping for each tag relative to annotated exons.</p>
         </sec>
         <sec>
            <st>
               <p>Statistical analysis</p>
            </st>
            <p>For the GO category comparisons, a standard <it>t</it>-test comparing two samples was used. The null hypothesis was that the two samples arose from populations with the same mean and standard deviation. The values within each sample were the number of GO categories represented in each library of the set, nine in the ESC set and four in the normal set. To account for variation due to library size, only the transcripts with the top 1,000 expression values were included. A one-sided <it>p </it>value was reported. Microsoft Excel was used to perform the computation.</p>
            <p>To select differentially expressed LongSAGE tags, the ESC and CGN meta-libraries were compared on a tag-by-tag basis to obtain a <it>p </it>value for the null hypothesis that the two tag frequencies arose from Poisson distributions with the same mean. This was derived using a normal approximation to the Poisson as described by Kal <it>et al</it>. <abbrgrp><abbr bid="B74">74</abbr></abbrgrp>. All transcripts that showed differences with a significance of <it>p </it>&lt; 0.05 were selected. Tag counts were converted to tags per million, and transcripts that differed by less than three-fold were eliminated. All pairs of tags existing within the same transcript were then listed if the differential expression for the two tags was in opposite directions.</p>
         </sec>
         <sec>
            <st>
               <p>RACE</p>
            </st>
            <p>First strand 5' and 3' RACE ready cDNA was synthesized from 2.0 &#956;g of DNase I (DNA-<it>free</it>&#8482; kit; Ambion, Austin, TX, USA) treated RNA using the BD SMART RACE cDNA Amplification kit following the manufacturer's recommended protocol (BD Biosciences Clontech, Mountain View, CA, USA). Gene specific 5' RACE primers were designed using custom scripts and Primer 3 <abbrgrp><abbr bid="B75">75</abbr></abbrgrp> to lie downstream of the target LongSAGE tag with an optimal Tm of 68&#176;C (Additional data file 10). For 3' RACE reactions a series of primers were designed manually based on the 5' RACE clone sequence (Additional data file 10). The cDNA was amplified using the Phusion&#8482; High-Fidelity PCR Kit (MJ Research, Inc., Waltham, MA, USA) following the manufacturer's recommended protocol with the addition of DMSO to a final concentration of 3%. The cycling conditions consisted of an initial denaturation at 98&#176;C for 30 seconds followed by 10 touchdown PCR cycles starting with 98&#176;C for 10 seconds, 72&#176;C (decreased by 1&#176;C in each subsequent cycle) for 15 seconds, 72&#176;C for 30 seconds; then 29 cycles of 98&#176;C for 10 seconds, 62&#176;C for 15 seconds, 72&#176;C for 30 seconds; followed by an extension at 72&#176;C for 10 minutes. PCR product for each sample (10 &#956;l) was loaded on a 1.2% agarose gel and subjected to electrophoresis for 3.5 hours at 110 mA in 1&#215; TBE buffer (Tris/Boric Acid/EDTA). The gel was stained with SYBR Green (Mandel, Guelph, ON, Canada) and visualized using a Typhoon 9400 Variable Mode Imager (Amersham, Baie d'Urfe, PQ, Canada). Amplicons were extracted from the gel, purified and cloned into the pCR4<sup>&#174;</sup>-TOPO<sup>&#174; </sup>vector using the TOPO TA Cloning<sup>&#174; </sup>Kit for Sequencing (Invitrogen). 
Plasmid vectors were electroporated into bacterial cells, and recombinant clones were selected on agar plates containing appropriate antibiotics as described <abbrgrp><abbr bid="B76">76</abbr></abbrgrp>. Glycerol stocks were prepared from 12 individual clone isolates per amplicon and stored in 384-well plates. Clone inserts were sequenced on an ABI PRISM 3730 XL DNA Analyzer using BigDye primer cycle sequencing reagents (Applied Biosystems, Foster City, CA, USA).</p>
         </sec>
         <sec>
            <st>
               <p>Quantitative RT-PCR</p>
            </st>
            <p>RNA was obtained from H9 cells before and after induction of differentiation using a 30-day embryoid body protocol. Undifferentiated H9 cells maintained for 7 days on Matrigel (BD Biosciences, San Jose, CA, USA) in media conditioned by mouse embryonic fibroblasts and supplemented with 4 ng/ml fibroblast growth factor (bFGF-2) were harvested for embryoid body formation. Briefly, the cells were incubated with TrypLE (Invitrogen) for 10 minutes at 37&#176;C and then collected by scraping. Resultant cell aggregates were subsequently cultured in non-adherent dishes using KOSR-based media without FGF2, for 15 to 30 days. At appropriate time-points RNA was extracted into Trizol. cDNA was synthesized from 2.0 &#956;g of DNase I (DNA-<it>free</it>&#8482; kit, Ambion) treated total RNA using the SuperScript Choice System following the manufacturer's recommended protocol (Invitrogen). Gene specific primer pairs were designed using custom scripts and Primer 3 <abbrgrp><abbr bid="B75">75</abbr></abbrgrp> to amplify approximately 150 bp of the target gene with an optimal Tm of 68&#176;C (Additional data file 10). Whenever possible amplicons were designed to cross exon/intron boundaries. Amplification was performed in a 10 &#956;l reaction mixture containing 5 &#956;l of 2&#215; SYBR Green PCR Master Mix (Applied Biosystems), 2 &#956;l of template cDNA, and 250 pmol of the forward and reverse primer pair. After preparation of the reaction mixtures in 96-well plates, the plates were centrifuged at 800 rpm for 1 minute in an Eppendorf 5810 swing rotor centrifuge (Eppendorf, Westbury, NY, USA). Amplification and detection were performed on an ABI Prism 7600 Sequence Detection System (Applied Biosystems). The PCR protocol consisted of the following: a single cycle of 10 minutes at 95&#176;C and 40 two-step cycles, with one cycle consisting of 15 seconds at 95&#176;C and 60 seconds at 60&#176;C. 
Results were analyzed as described <abbrgrp><abbr bid="B77">77</abbr></abbrgrp> using a GAPDH probe for normalization.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Additional data files</p>
         </st>
         <p>The following additional data are available with the online version of this paper. Additional data file <supplr sid="S1">1</supplr> is a summary of mouse specific tag types identified. Additional data file <supplr sid="S2">2</supplr> is a table of genomic mappings for 268,515 unique tag sequences found in nine independent human embryonic stem cell lines. Additional data file <supplr sid="S3">3</supplr> is a Gene Ontology analysis of nine independent human embryonic stem cells. Tag counts are expressed for each GO category for the top 1,000 by tag count. Additional data file <supplr sid="S4">4</supplr> lists statistically significant differentially expressed LongSAGE tags found between embryonic stem cells and terminally differentiated tissues. Additional data file <supplr sid="S5">5</supplr> is a table listing the 4,337 genes found in common across 8 undifferentiated human embryonic stem cell lines. Additional data file <supplr sid="S6">6</supplr> is a table listing the 20,047 LongSAGE tags exclusively expressed in embryonic stem cell lines. Additional data file <supplr sid="S7">7</supplr> is a table listing the 634 LongSAGE tags exclusively expressed in ESCs that uniquely map to the human genome at least 2 kb away from an annotated transcript. Additional data file <supplr sid="S8">8</supplr> is a table listing the 301 LongSAGE tags exclusively expressed in ESCs that uniquely map to species conserved regions of the human genome at least 2 kb away from an annotated transcript. Additional data file <supplr sid="S9">9</supplr> is a table listing the 52 ESC specific transcripts identified by 5' RACE. Additional data file <supplr sid="S10">10</supplr> lists the RACE and qPCR primer sequences used in this study.</p>
         <suppl id="S1">
            <title>
               <p>Additional data file 1</p>
            </title>
            <caption>
               <p>Summary of mouse specific tag types identified</p>
            </caption>
            <text>
               <p>Summary of mouse specific tag types identified.</p>
            </text>
            <file name="gb-2007-8-6-r113-S1.xls">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S2">
            <title>
               <p>Additional data file 2</p>
            </title>
            <caption>
               <p>Genomic mappings for 268,515 unique tag sequences found in nine independent human embryonic stem cell lines</p>
            </caption>
            <text>
               <p>Genomic mappings for 268,515 unique tag sequences found in nine independent human embryonic stem cell lines.</p>
            </text>
            <file name="gb-2007-8-6-r113-S2.zip">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S3">
            <title>
               <p>Additional data file 3</p>
            </title>
            <caption>
               <p>Gene Ontology analysis of nine independent human embryonic stem cells</p>
            </caption>
            <text>
               <p>Tag counts are expressed for each GO category for the top 1,000 by tag count.</p>
            </text>
            <file name="gb-2007-8-6-r113-S3.xls">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S4">
            <title>
               <p>Additional data file 4</p>
            </title>
            <caption>
               <p>Statistically significant differentially expressed LongSAGE tags found between embryonic stem cells and terminally differentiated tissues</p>
            </caption>
            <text>
               <p>Statistically significant differentially expressed LongSAGE tags found between embryonic stem cells and terminally differentiated tissues.</p>
            </text>
            <file name="gb-2007-8-6-r113-S4.xls">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S5">
            <title>
               <p>Additional data file 5</p>
            </title>
            <caption>
               <p>The 4,337 genes found in common across 8 undifferentiated human embryonic stem cell lines</p>
            </caption>
            <text>
               <p>The 4,337 genes found in common across 8 undifferentiated human embryonic stem cell lines.</p>
            </text>
            <file name="gb-2007-8-6-r113-S5.xls">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S6">
            <title>
               <p>Additional data file 6</p>
            </title>
            <caption>
               <p>The 20,047 LongSAGE tags exclusively expressed in embryonic stem cell lines</p>
            </caption>
            <text>
               <p>The 20,047 LongSAGE tags exclusively expressed in embryonic stem cell lines.</p>
            </text>
            <file name="gb-2007-8-6-r113-S6.xls">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S7">
            <title>
               <p>Additional data file 7</p>
            </title>
            <caption>
               <p>The 634 LongSAGE tags exclusively expressed in ESCs that uniquely map to the human genome at least 2 kb away from an annotated transcript</p>
            </caption>
            <text>
               <p>The 634 LongSAGE tags exclusively expressed in ESCs that uniquely map to the human genome at least 2 kb away from an annotated transcript.</p>
            </text>
            <file name="gb-2007-8-6-r113-S7.xls">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S8">
            <title>
               <p>Additional data file 8</p>
            </title>
            <caption>
               <p>The 301 LongSAGE tags exclusively expressed in ESCs that uniquely map to species conserved regions of the human genome at least 2 kb away from an annotated transcript</p>
            </caption>
            <text>
               <p>The 301 LongSAGE tags exclusively expressed in ESCs that uniquely map to species conserved regions of the human genome at least 2 kb away from an annotated transcript.</p>
            </text>
            <file name="gb-2007-8-6-r113-S8.xls">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S9">
            <title>
               <p>Additional data file 9</p>
            </title>
            <caption>
               <p>The 52 ESC specific transcripts identified by 5' RACE</p>
            </caption>
            <text>
               <p>The 52 ESC specific transcripts identified by 5' RACE.</p>
            </text>
            <file name="gb-2007-8-6-r113-S9.xls">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S10">
            <title>
               <p>Additional data file 10</p>
            </title>
            <caption>
               <p>RACE and qPCR primer sequences used in this study</p>
            </caption>
            <text>
               <p>RACE and qPCR primer sequences used in this study.</p>
            </text>
            <file name="gb-2007-8-6-r113-S10.xls">
               <p>Click here for file</p>
            </file>
         </suppl>
      </sec>
   </bdy>
   <bm>
      <ack>
         <sec>
            <st>
               <p>Acknowledgements</p>
            </st>
            <p>We are grateful to MF Pera (Monash Institute of Medical Research, Monash University and the Australian Stem Cell Center, Clayton, Victoria, Australia), MT Firpo (Department of Obstetrics, Gynecology and Reproductive Sciences, University of California San Francisco, San Francisco, CA) and BresaGen Inc. (Athens, GA), for providing human ESC RNA samples. This project was supported by funds from the National Cancer Institute, National Institutes of Health, under Contract No. N01-C0-12400 and by grants from Genome Canada, Genome British Columbia and the Canadian Stem Cell Network to MAM and CE. MAM is a Scholar of the Michael Smith Foundation for Health Research and is a Terry Fox Young Investigator of the National Cancer Institute of Canada. The content of this publication does not necessarily reflect the views or policies of the US Department of Health and Human Services, nor does mention of trade names, commercial products, or organizations imply endorsement by the US Government.</p>
         </sec>
      </ack>
      <refgrp>
         <bibl id="B1">
            <title>
               <p>Establishment in culture of pluripotential cells from mouse embryos.</p>
            </title>
            <aug>
               <au>
                  <snm>Evans</snm>
                  <fnm>MJ</fnm>
               </au>
               <au>
                  <snm>Kaufman</snm>
                  <fnm>MH</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>1981</pubdate>
            <volume>292</volume>
            <fpage>154</fpage>
            <lpage>156</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/292154a0</pubid>
                  <pubid idtype="pmpid">7242681</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B2">
            <title>
               <p>Embryonic stem cell lines derived from human blastocysts.</p>
            </title>
            <aug>
               <au>
                  <snm>Thomson</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Itskovitz-Eldor</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Shapiro</snm>
                  <fnm>SS</fnm>
               </au>
               <au>
                  <snm>Waknitz</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Swiergiel</snm>
                  <fnm>JJ</fnm>
               </au>
               <au>
                  <snm>Marshall</snm>
                  <fnm>VS</fnm>
               </au>
               <au>
                  <snm>Jones</snm>
                  <fnm>JM</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>1998</pubdate>
            <volume>282</volume>
            <fpage>1145</fpage>
            <lpage>1147</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.282.5391.1145</pubid>
                  <pubid idtype="pmpid" link="fulltext">9804556</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B3">
            <title>
               <p>Octamer binding proteins confer transcriptional activity in early mouse embryogenesis.</p>
            </title>
            <aug>
               <au>
                  <snm>Scholer</snm>
                  <fnm>HR</fnm>
               </au>
               <au>
                  <snm>Balling</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Hatzopoulos</snm>
                  <fnm>AK</fnm>
               </au>
               <au>
                  <snm>Suzuki</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Gruss</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>EMBO J</source>
            <pubdate>1989</pubdate>
            <volume>8</volume>
            <fpage>2551</fpage>
            <lpage>2557</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">401254</pubid>
                  <pubid idtype="pmpid">2573524</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B4">
            <title>
               <p>The homeoprotein Nanog is required for maintenance of pluripotency in mouse epiblast and ES cells.</p>
            </title>
            <aug>
               <au>
                  <snm>Mitsui</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Tokuzawa</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Itoh</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Segawa</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Murakami</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Takahashi</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Maruyama</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Maeda</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Yamanaka</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>Cell</source>
            <pubdate>2003</pubdate>
            <volume>113</volume>
            <fpage>631</fpage>
            <lpage>642</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0092-8674(03)00393-3</pubid>
                  <pubid idtype="pmpid" link="fulltext">12787504</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B5">
            <title>
               <p>Functional expression cloning of Nanog, a pluripotency sustaining factor in embryonic stem cells.</p>
            </title>
            <aug>
               <au>
                  <snm>Chambers</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Colby</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Robertson</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Nichols</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Lee</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Tweedie</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Smith</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>Cell</source>
            <pubdate>2003</pubdate>
            <volume>113</volume>
            <fpage>643</fpage>
            <lpage>655</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0092-8674(03)00392-1</pubid>
                  <pubid idtype="pmpid" link="fulltext">12787505</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B6">
            <title>
               <p>Multipotent cell lineages in early mouse development depend on SOX2 function.</p>
            </title>
            <aug>
               <au>
                  <snm>Avilion</snm>
                  <fnm>AA</fnm>
               </au>
               <au>
                  <snm>Nicolis</snm>
                  <fnm>SK</fnm>
               </au>
               <au>
                  <snm>Pevny</snm>
                  <fnm>LH</fnm>
               </au>
               <au>
                  <snm>Perez</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Vivian</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Lovell-Badge</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>Genes Dev</source>
            <pubdate>2003</pubdate>
            <volume>17</volume>
            <fpage>126</fpage>
            <lpage>140</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">195970</pubid>
                  <pubid idtype="pmpid" link="fulltext">12514105</pubid>
                  <pubid idtype="doi">10.1101/gad.224503</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B7">
            <title>
               <p>Genesis, a winged helix transcriptional repressor with expression restricted to embryonic stem cells.</p>
            </title>
            <aug>
               <au>
                  <snm>Sutton</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Costa</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Klug</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Field</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Xu</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Largaespada</snm>
                  <fnm>DA</fnm>
               </au>
               <au>
                  <snm>Fletcher</snm>
                  <fnm>CF</fnm>
               </au>
               <au>
                  <snm>Jenkins</snm>
                  <fnm>NA</fnm>
               </au>
               <au>
                  <snm>Copeland</snm>
                  <fnm>NG</fnm>
               </au>
               <au>
                  <snm>Klemsz</snm>
                  <fnm>M</fnm>
               </au>
               <etal/>
            </aug>
            <source>J Biol Chem</source>
            <pubdate>1996</pubdate>
            <volume>271</volume>
            <fpage>23126</fpage>
            <lpage>23133</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1074/jbc.271.38.23126</pubid>
                  <pubid idtype="pmpid" link="fulltext">8798505</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B8">
            <title>
               <p>Inactivation of the FGF-4 gene in embryonic stem cells alters the growth and/or the survival of their early differentiated progeny.</p>
            </title>
            <aug>
               <au>
                  <snm>Wilder</snm>
                  <fnm>PJ</fnm>
               </au>
               <au>
                  <snm>Kelly</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Brigman</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Peterson</snm>
                  <fnm>CL</fnm>
               </au>
               <au>
                  <snm>Nowling</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Gao</snm>
                  <fnm>QS</fnm>
               </au>
               <au>
                  <snm>McComb</snm>
                  <fnm>RD</fnm>
               </au>
               <au>
                  <snm>Capecchi</snm>
                  <fnm>MR</fnm>
               </au>
               <au>
                  <snm>Rizzino</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>Dev Biol</source>
            <pubdate>1997</pubdate>
            <volume>192</volume>
            <fpage>614</fpage>
            <lpage>629</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1006/dbio.1997.8777</pubid>
                  <pubid idtype="pmpid" link="fulltext">9441693</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B9">
            <title>
               <p>Developmental-specific activity of the FGF-4 enhancer requires the synergistic action of Sox2 and Oct-3.</p>
            </title>
            <aug>
               <au>
                  <snm>Yuan</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Corbi</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Basilico</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Dailey</snm>
                  <fnm>L</fnm>
               </au>
            </aug>
            <source>Genes Dev</source>
            <pubdate>1995</pubdate>
            <volume>9</volume>
            <fpage>2635</fpage>
            <lpage>2645</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1101/gad.9.21.2635</pubid>
                  <pubid idtype="pmpid" link="fulltext">7590241</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B10">
            <title>
               <p>BMP4 initiates human embryonic stem cell differentiation to trophoblast.</p>
            </title>
            <aug>
               <au>
                  <snm>Xu</snm>
                  <fnm>RH</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>DS</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Addicks</snm>
                  <fnm>GC</fnm>
               </au>
               <au>
                  <snm>Glennon</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Zwaka</snm>
                  <fnm>TP</fnm>
               </au>
               <au>
                  <snm>Thomson</snm>
                  <fnm>JA</fnm>
               </au>
            </aug>
            <source>Nat Biotechnol</source>
            <pubdate>2002</pubdate>
            <volume>20</volume>
            <fpage>1261</fpage>
            <lpage>1264</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1038/nbt761</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B11">
            <title>
               <p>Human embryonic stem cell and embryonic germ cell lines.</p>
            </title>
            <aug>
               <au>
                  <snm>Thomson</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Odorico</snm>
                  <fnm>JS</fnm>
               </au>
            </aug>
            <source>Trends Biotechnol</source>
            <pubdate>2000</pubdate>
            <volume>18</volume>
            <fpage>53</fpage>
            <lpage>57</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0167-7799(99)01410-9</pubid>
                  <pubid idtype="pmpid" link="fulltext">10652509</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B12">
            <title>
               <p>Maintenance of pluripotency in human and mouse embryonic stem cells through activation of Wnt signaling by a pharmacological GSK-3-specific inhibitor.</p>
            </title>
            <aug>
               <au>
                  <snm>Sato</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Meijer</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Skaltsounis</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Greengard</snm>