<?xml version='1.0'?>
<!DOCTYPE art SYSTEM 'http://www.biomedcentral.com/xml/article.dtd'>
<art>
   <ui>gb-2007-8-10-r214</ui>
   <ji>GBJ</ji>
   <fm>
      <dochead>Research</dochead>
      <bibl>
         <title>
            <p>MicroRNA expression profiling of human breast cancer identifies new markers of tumor subtype</p>
         </title>
         <aug>
            <au id="A1" ce="yes">
               <snm>Blenkiron</snm>
               <fnm>Cherie</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <insr iid="I3"/>
               <insr iid="I4"/>
               <email>cb391@cam.ac.uk</email>
            </au>
            <au id="A2" ce="yes">
               <snm>Goldstein</snm>
               <mi>D</mi>
               <fnm>Leonard</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <insr iid="I5"/>
               <email>ldg21@cam.ac.uk</email>
            </au>
            <au id="A3">
               <snm>Thorne</snm>
               <mi>P</mi>
               <fnm>Natalie</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <insr iid="I5"/>
               <email>npt22@cam.ac.uk</email>
            </au>
            <au id="A4">
               <snm>Spiteri</snm>
               <fnm>Inmaculada</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <email>Inma.Spiteri@cancer.org.uk</email>
            </au>
            <au id="A5">
               <snm>Chin</snm>
               <fnm>Suet-Feung</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <email>Suet-Feung.Chin@cancer.org.uk</email>
            </au>
            <au id="A6">
               <snm>Dunning</snm>
               <mi>J</mi>
               <fnm>Mark</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <email>md392@cam.ac.uk</email>
            </au>
            <au id="A7">
               <snm>Barbosa-Morais</snm>
               <mi>L</mi>
               <fnm>Nuno</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <email>nlbmb2@cam.ac.uk</email>
            </au>
            <au id="A8">
               <snm>Teschendorff</snm>
               <mi>E</mi>
               <fnm>Andrew</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <email>aet21@cam.ac.uk</email>
            </au>
            <au id="A9">
               <snm>Green</snm>
               <mi>R</mi>
               <fnm>Andrew</fnm>
               <insr iid="I6"/>
               <email>andrew.green@nottingham.ac.uk</email>
            </au>
            <au id="A10">
               <snm>Ellis</snm>
               <mi>O</mi>
               <fnm>Ian</fnm>
               <insr iid="I6"/>
               <email>ian.ellis@nottingham.ac.uk</email>
            </au>
            <au id="A11">
               <snm>Tavar&#233;</snm>
               <fnm>Simon</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <insr iid="I5"/>
               <email>Simon.Tavare@cancer.org.uk</email>
            </au>
            <au id="A12" ca="yes">
               <snm>Caldas</snm>
               <fnm>Carlos</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <email>cc234@cam.ac.uk</email>
            </au>
            <au id="A13" ca="yes">
               <snm>Miska</snm>
               <mi>A</mi>
               <fnm>Eric</fnm>
               <insr iid="I3"/>
               <insr iid="I4"/>
               <email>eam29@cam.ac.uk</email>
            </au>
         </aug>
         <insg>
            <ins id="I1">
               <p>Cancer Research UK, Cambridge Research Institute, Li Ka-Shing Centre, Robinson Way, Cambridge CB2 0RE, UK</p>
            </ins>
            <ins id="I2">
               <p>Department of Oncology, University of Cambridge, Hills Road, Cambridge CB2 2XZ, UK</p>
            </ins>
            <ins id="I3">
               <p>Wellcome Trust/Cancer Research UK Gurdon Institute, University of Cambridge, The Henry Wellcome Building of Cancer and Developmental Biology, Tennis Court Rd, Cambridge CB2 1QN, UK</p>
            </ins>
            <ins id="I4">
               <p>Department of Biochemistry, University of Cambridge, Tennis Court Rd, Cambridge CB2 1GA, UK</p>
            </ins>
            <ins id="I5">
               <p>Department of Applied Mathematics and Theoretical Physics, University of Cambridge, Centre for Mathematical Sciences, Wilberforce Road, Cambridge CB3 0WA, UK</p>
            </ins>
            <ins id="I6">
               <p>Department of Histopathology, School of Molecular Medical Sciences, University of Nottingham, Nottingham NG5 1PB, UK</p>
            </ins>
         </insg>
         <source>Genome Biology</source>
         <issn>1465-6906</issn>
         <pubdate>2007</pubdate>
         <volume>8</volume>
         <issue>10</issue>
         <fpage>R214</fpage>
         <url>http://genomebiology.com/2007/8/10/R214</url>
         <xrefbib>
            <pubidlist>
               <pubid idtype="pmpid">17922911</pubid>
               <pubid idtype="doi">10.1186/gb-2007-8-10-r214</pubid>
            </pubidlist>
         </xrefbib>
      </bibl>
      <history>
         <rec>
            <date>
               <day>5</day>
               <month>6</month>
               <year>2007</year>
            </date>
         </rec>
         <revrec>
            <date>
               <day>22</day>
               <month>8</month>
               <year>2007</year>
            </date>
         </revrec>
         <acc>
            <date>
               <day>8</day>
               <month>10</month>
               <year>2007</year>
            </date>
         </acc>
         <pub>
            <date>
               <day>08</day>
               <month>10</month>
               <year>2007</year>
            </date>
         </pub>
      </history>
      <cpyrt>
         <year>2007</year>
         <collab>Blenkiron et al.; licensee BioMed Central Ltd.</collab>
         <note>This is an open access article distributed under the terms of the Creative Commons Attribution License (<url>http://creativecommons.org/licenses/by/2.0</url>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</note>
      </cpyrt>
      <shorttitle>
         <p>microRNA expression profiling of human breast cancer</p>
      </shorttitle>
      <shortabs>
         <p>Integrated analysis of miRNA expression and genomic changes in human breast tumors allows the classification of tumor subtypes.</p>
      </shortabs>
      <abs>
         <sec>
            <st>
               <p>Abstract</p>
            </st>
            <sec>
               <st>
                  <p>Background</p>
               </st>
               <p>MicroRNAs (miRNAs), a class of short non-coding RNAs found in many plants and animals, often act post-transcriptionally to inhibit gene expression.</p>
            </sec>
            <sec>
               <st>
                  <p>Results</p>
               </st>
               <p>Here we report the analysis of miRNA expression in 93 primary human breast tumors, using a bead-based flow cytometric miRNA expression profiling method. Of 309 human miRNAs assayed, we identify 133 miRNAs expressed in human breast and breast tumors. We used mRNA expression profiling to classify the breast tumors as luminal A, luminal B, basal-like, HER2+ and normal-like. A number of miRNAs are differentially expressed between these molecular tumor subtypes and individual miRNAs are associated with clinicopathological factors. Furthermore, we find that miRNAs could classify basal versus luminal tumor subtypes in an independent data set. In some cases, changes in miRNA expression correlate with genomic loss or gain; in others, changes in miRNA expression are likely due to changes in primary transcription and or miRNA biogenesis. Finally, the expression of <it>DICER1 </it>and <it>AGO2 </it>is correlated with tumor subtype and may explain some of the changes in miRNA expression observed.</p>
            </sec>
            <sec>
               <st>
                  <p>Conclusion</p>
               </st>
               <p>This study represents the first integrated analysis of miRNA expression, mRNA expression and genomic changes in human breast cancer and may serve as a basis for functional studies of the role of miRNAs in the etiology of breast cancer. Furthermore, we demonstrate that bead-based flow cytometric miRNA expression profiling might be a suitable platform to classify breast cancer into prognostic molecular subtypes.</p>
            </sec>
         </sec>
      </abs>
   </fm>
   <meta>
      <classifications>
         <classification type="BMC" subtype="man_spc_id" id="30010003">Cancer</classification>
         <classification type="BMC" subtype="man_spc_id" id="30010009">Genetics</classification>
         <classification type="BMC" subtype="man_spc_id" id="30010012">Medicine</classification>
      </classifications>
   </meta>
   <bdy>
      <sec>
         <st>
            <p>Background</p>
         </st>
         <p>MicroRNAs (miRNAs) were discovered in <it>Caenorhabditis elegans </it>during studies of the control of developmental timing <abbrgrp><abbr bid="B1">1</abbr><abbr bid="B2">2</abbr><abbr bid="B3">3</abbr><abbr bid="B4">4</abbr><abbr bid="B5">5</abbr></abbrgrp>. miRNAs are approximately 22-nucleotide non-coding RNAs that are thought to regulate gene expression through sequence-specific base-pairing with target mRNAs <abbrgrp><abbr bid="B6">6</abbr></abbrgrp>. To date, thousands of miRNAs have been identified in organisms as diverse as roundworms, flies, fish, frogs, mammals, flowering plants, mosses, and even viruses, using genetics, molecular cloning and predictions from bioinformatics <abbrgrp><abbr bid="B7">7</abbr><abbr bid="B8">8</abbr><abbr bid="B9">9</abbr><abbr bid="B10">10</abbr><abbr bid="B11">11</abbr><abbr bid="B12">12</abbr><abbr bid="B13">13</abbr><abbr bid="B14">14</abbr><abbr bid="B15">15</abbr><abbr bid="B16">16</abbr></abbrgrp>. The human genome encodes at least 474 miRNA genes <abbrgrp><abbr bid="B17">17</abbr><abbr bid="B18">18</abbr></abbrgrp>.</p>
         <p>miRNAs are transcribed as long RNA precursors (pri-miRNAs), which are processed in the nucleus by the RNase III enzyme complex Drosha-Pasha/DGCR8 to form the approximately 70-base pre-miRNAs <abbrgrp><abbr bid="B19">19</abbr><abbr bid="B20">20</abbr><abbr bid="B21">21</abbr><abbr bid="B22">22</abbr><abbr bid="B23">23</abbr></abbrgrp>. Pre-miRNAs are exported from the nucleus by Exportin-5 <abbrgrp><abbr bid="B24">24</abbr></abbrgrp>, processed by the RNase III enzyme Dicer, and incorporated into an Argonaute-containing RNA-induced silencing complex (RISC) <abbrgrp><abbr bid="B25">25</abbr></abbrgrp>. Within the silencing complex, miRNAs pair to the messages of protein-coding genes, usually through imperfect base-pairing with the 3'-untranslated region (3'UTR), thereby specifying the post-transcriptional repression of these target mRNAs <abbrgrp><abbr bid="B6">6</abbr><abbr bid="B26">26</abbr></abbrgrp>. Binding of the silencing complex causes translational repression <abbrgrp><abbr bid="B27">27</abbr><abbr bid="B28">28</abbr><abbr bid="B29">29</abbr></abbrgrp> and/or mRNA destabilization, which is sometimes through direct mRNA cleavage <abbrgrp><abbr bid="B30">30</abbr><abbr bid="B31">31</abbr></abbrgrp> but usually through other mechanisms <abbrgrp><abbr bid="B32">32</abbr><abbr bid="B33">33</abbr><abbr bid="B34">34</abbr><abbr bid="B35">35</abbr><abbr bid="B36">36</abbr></abbrgrp>.</p>
         <p>The function of human miRNAs is largely unknown. However, studies in roundworms, flies, fish and mice have demonstrated important roles for miRNAs in animal development <abbrgrp><abbr bid="B37">37</abbr></abbrgrp>. miRNA target predictions suggest important roles for miRNAs in humans. Because many mRNAs have been under selective pressure to preserve pairing to a six nucleotide sequence in the 5' region of the miRNA known as the miRNA seed (nucleotides 2-7), targets of metazoan miRNAs can be predicted by searching for conserved matches to the seed region <abbrgrp><abbr bid="B38">38</abbr><abbr bid="B39">39</abbr><abbr bid="B40">40</abbr><abbr bid="B41">41</abbr><abbr bid="B42">42</abbr></abbrgrp>. In humans, at least 10% of the protein-coding mRNAs might be conserved targets of miRNAs <abbrgrp><abbr bid="B38">38</abbr><abbr bid="B39">39</abbr><abbr bid="B41">41</abbr><abbr bid="B42">42</abbr><abbr bid="B43">43</abbr><abbr bid="B44">44</abbr><abbr bid="B45">45</abbr><abbr bid="B46">46</abbr><abbr bid="B47">47</abbr><abbr bid="B48">48</abbr><abbr bid="B49">49</abbr></abbrgrp>.</p>
         <p>Despite their recent discovery, strong links between miRNAs and human cancer are emerging. Initial observations in roundworms and flies suggested possible connections between miRNAs and proliferation defects <abbrgrp><abbr bid="B50">50</abbr></abbrgrp>. More recently, it was shown that the human miRNAs miR-15a and miR-16-1 map to a region on 13q14 that is often deleted in B-cell chronic lymphocytic leukemias (CLL) and that miR-15a and miR-16-1 are frequently deregulated in CLL patients <abbrgrp><abbr bid="B51">51</abbr></abbrgrp>. A second study found that miR-143 and miR-145 expression levels were reduced in adenomatous and cancer stages of colorectal neoplasia <abbrgrp><abbr bid="B52">52</abbr></abbrgrp>. Subsequently, a number of studies, using a range of techniques, including miRNA cloning, quantitative PCR, microarrays and bead-based flow cytometric miRNA expression profiling <abbrgrp><abbr bid="B53">53</abbr><abbr bid="B54">54</abbr><abbr bid="B55">55</abbr><abbr bid="B56">56</abbr></abbrgrp>, demonstrated that miRNA expression is deregulated in many human cancers.</p>
         <p>A number of miRNAs were found to have oncogenic potential. For example, the <it>mir-17 </it>miRNA cluster cooperates with the oncogene <it>Myc </it>to induce tumors in a mouse model <abbrgrp><abbr bid="B57">57</abbr></abbrgrp> and miR-372 and miR-373 were found to cooperate with <it>RAS </it>in an <it>in vitro </it>assay <abbrgrp><abbr bid="B58">58</abbr></abbrgrp>. miRNAs might also act as tumor suppressors. For example, deregulation of the oncogene <it>RAS </it>and <it>HMGA2 </it>by loss of regulation through the <it>let-7 </it>family of miRNAs might contribute to human cancer <abbrgrp><abbr bid="B59">59</abbr><abbr bid="B60">60</abbr><abbr bid="B61">61</abbr></abbrgrp>. It is unclear how miRNAs might be deregulated in cancer; however, it has been observed that many human miRNAs lie within cancer associated genomic regions, that is, areas of loss, gain or rearrangement of the DNA in tumors <abbrgrp><abbr bid="B62">62</abbr></abbrgrp>. However, transcriptional or post-transcriptional regulation of miRNAs in cancer has also been proposed <abbrgrp><abbr bid="B63">63</abbr><abbr bid="B64">64</abbr></abbrgrp>.</p>
         <p>The molecular classification of human tumors using mRNA microarray profiling is an area of intense research. A number of classifiers have been developed for human breast tumors, including the use of expression signatures as prognostic tools <abbrgrp><abbr bid="B65">65</abbr><abbr bid="B66">66</abbr><abbr bid="B67">67</abbr><abbr bid="B68">68</abbr><abbr bid="B69">69</abbr><abbr bid="B70">70</abbr><abbr bid="B71">71</abbr><abbr bid="B72">72</abbr><abbr bid="B73">73</abbr><abbr bid="B74">74</abbr><abbr bid="B75">75</abbr></abbrgrp>. One of these classifiers can be used as a single sample predictor (SSP) to assign individual samples to one of five breast tumor subtypes: luminal A, luminal B, basal-like, HER2+ and normal breast-like <abbrgrp><abbr bid="B65">65</abbr><abbr bid="B69">69</abbr><abbr bid="B70">70</abbr><abbr bid="B76">76</abbr></abbrgrp>.</p>
         <p>Two recent studies have shown that a number of miRNAs are deregulated in human breast cancer <abbrgrp><abbr bid="B77">77</abbr><abbr bid="B78">78</abbr></abbrgrp>. A third study found that a number of miRNAs were differentially expressed in breast tumor biopsies and that miRNA expression correlated with HER2 and estrogen receptor (ER) status <abbrgrp><abbr bid="B79">79</abbr></abbrgrp>.</p>
         <p>This study represents the first integrated analysis of miRNA expression, mRNA expression and genomic changes in human breast cancer and may serve as a basis for functional studies of the role of miRNAs in the etiology of breast cancer. Furthermore, we demonstrate that bead-based flow cytometric miRNA expression profiling might be a suitable platform to classify breast cancer into prognostic molecular subtypes. This potential will need to be addressed in a prospective study.</p>
      </sec>
      <sec>
         <st>
            <p>Results</p>
         </st>
         <sec>
            <st>
               <p>There are 133 miRNAs expressed in normal human breast and primary human breast cancer</p>
            </st>
            <p>To generate a comprehensive set of miRNA expression profiles for primary human breast cancer we selected 99 primary human tumors, 5 normal breast samples and 33 breast cancer cell lines for miRNA expression profiling. Tumor samples were fresh-frozen and collected from Nottingham City Hospital Tumor Bank and are representative with regard to tumor subtypes and clinical parameters <abbrgrp><abbr bid="B80">80</abbr><abbr bid="B81">81</abbr><abbr bid="B82">82</abbr></abbrgrp>. For miRNA profiling we chose a bead-based flow-cytometric miRNA expression platform, which has recently been developed and was found to have several advantages over glass-slide microarray profiling, including increased specificity <abbrgrp><abbr bid="B56">56</abbr></abbrgrp>. We developed this platform further to include 333 probes for 309 unique human miRNAs based on the miRNA repository miRBase 8.1 <abbrgrp><abbr bid="B17">17</abbr><abbr bid="B18">18</abbr></abbrgrp>. miRNA labeling included RNA size selection using native polyacrylamide gels, ensuring that only mature miRNAs were assayed.</p>
            <p>Using this miRNA expression platform we analyzed a total of 137 samples in 168 assays. Assays for 119 of these 137 samples (87%) passed our quality control, including 93 primary tumor samples, 5 normal breast samples and 21 cell lines (Additional data file 1). We detected the expression of 137 miRNAs in this sample set, 133 of which we detected in normal breast or breast tumors. We included a number of replicate probes and technical replicate samples and found that results were reproducible (Additional data files 5 and 6). For a subset of miRNAs and a subset of samples we also performed quantitative RT-PCR to independently assess miRNA expression (Additional data file 7). While there is generally good correlation between miRNA expression on both platforms, we do observe probe-specific differences. Sample quantity did not permit validation of miRNA expression using northern blotting; however, the bead-based flow-cytometric miRNA expression platform had been validated using northern blotting previously <abbrgrp><abbr bid="B56">56</abbr></abbrgrp>.</p>
            <p>Unsupervised hierarchical clustering of miRNA expression clearly separated cell lines from both normal breast and tumor samples and suggested that miRNA expression in cell lines is largely deregulated (Figure <figr fid="F1">1a</figr>). We did not observe a perfect separation of normal and tumor samples, as has been described before for primary human tumors <abbrgrp><abbr bid="B56">56</abbr></abbrgrp>. However, as our study was focused on tumor subtypes, we profiled only a small number of normal breast samples. As we found major differences in miRNA expression between primary human tissue and cell lines, we excluded cell lines from subsequent analyses. Unsupervised clustering of the tumor samples revealed striking differences in miRNA expression between ER- and ER+ tumors (Figure <figr fid="F1">1b</figr>).</p>
            <fig id="F1">
               <title>
                  <p>Figure 1</p>
               </title>
               <caption>
                  <p>Unsupervised hierarchical clustering (Pearson correlation, average linkage) over 137 detected miRNAs</p>
               </caption>
               <text>
                  <p>Unsupervised hierarchical clustering (Pearson correlation, average linkage) over 137 detected miRNAs. Heatmap colors represent relative miRNA expression as indicated in the color key. <b>(a) </b>Clustering of 21 cell lines (orange), 5 normal breast samples (green) and 93 primary tumors (blue). <b>(b) </b>Clustering of 93 primary tumors with ER status as shown.</p>
               </text>
               <graphic file="gb-2007-8-10-r214-1"/>
            </fig>
         </sec>
         <sec>
            <st>
               <p>MicroRNAs are differentially expressed between molecular breast tumor subtypes with clinical implications</p>
            </st>
            <p>Next we tested if miRNAs are differentially expressed among breast cancer subtypes. To identify the molecular subtypes of our tumor samples we used a single sample predictor (SSP), which classifies breast tumors into five subtypes: luminal A, luminal B, basal-like, HER2+ and normal-like <abbrgrp><abbr bid="B65">65</abbr><abbr bid="B69">69</abbr><abbr bid="B70">70</abbr><abbr bid="B76">76</abbr></abbrgrp>. In addition to differences in mRNA expression profiles, these tumor subtypes also display distinct clinicopathological characteristics, including different survival rates (Additional data files 8 and 9). For example, the basal-like and HER2+ tumors are less differentiated and more aggressive and the luminal A and luminal B tumors are mostly ER+ with good and poor clinical outcome, respectively. Based on Agilent and Illumina mRNA expression data for 86 of our tumor samples <abbrgrp><abbr bid="B83">83</abbr></abbrgrp> (unpublished results) we were able to classify 51 of the 93 tumor samples as 16 basal-like, 15 luminal A, 9 luminal B, 5 HER2+ and 6 normal-like tumors (Additional data file 1). miRNAs that were found to be differentially expressed in the tumor subtypes are shown in Figure <figr fid="F2">2a,b</figr>. miRNAs that are part of the same family show highly correlated expression. For example, the nine miRNAs that were found to be differentially expressed between luminal A and luminal B tumors represent seven miRNA families (Figure <figr fid="F2">2b</figr>).</p>
            <fig id="F2">
               <title>
                  <p>Figure 2</p>
               </title>
               <caption>
                  <p>Supervised hierarchical clustering over selected miRNAs (Pearson correlation, average linkage)</p>
               </caption>
               <text>
                  <p>Supervised hierarchical clustering over selected miRNAs (Pearson correlation, average linkage). Heatmap colors represent relative miRNA expression as indicated in the color key for each panel. Brackets in the right margin indicate members of the same miRNA family. <b>(a) </b>Clustering of 51 tumor samples that could be classified as basal-like (red), HER2+ (pink), luminal A (dark blue), luminal B (light blue) or normal-like (green) over 38 miRNAs with Benjamini-Hochberg adjusted Kruskal-Wallis <it>p </it>&lt; 0.05. <b>(b) </b>Clustering of 24 tumor samples classified as luminal A (dark blue) or luminal B (light blue) over 9 miRNAs with Benjamini-Hochberg adjusted Wilcoxon <it>p </it>&lt; 0.05.</p>
               </text>
               <graphic file="gb-2007-8-10-r214-2"/>
            </fig>
            <p>Given the large number of miRNAs differentially expressed between molecular subtypes, we investigated the predictive potential of miRNAs in an independent test set. Using all 137 expressed miRNAs, we performed a model-based discriminant analysis <abbrgrp><abbr bid="B84">84</abbr></abbrgrp> for the 16 basal-like and 15 luminal A tumors, the two largest subtype groups in our study (Additional data file 1). As we aimed to distinguish between molecular subtypes, we required a test set of samples with both miRNA and mRNA expression data available. The bead-based miRNA expression data in Lu <it>et al</it>. <abbrgrp><abbr bid="B56">56</abbr></abbrgrp> included 11 breast tumor samples with corresponding Affymetrix gene expression data published in <abbrgrp><abbr bid="B56">56</abbr><abbr bid="B85">85</abbr></abbrgrp>. To our knowledge, no other studies with miRNA and mRNA data on breast tumor samples have been published. Based on the gene expression profiles and the SSP, six tumor samples could be assigned to molecular subtypes, three of which were classified as basal-like, two as luminal A and one as HER2+ (Additional data files 1, 14 and 19). Using the discriminator derived from our miRNA data, all three basal-like and two luminal A tumors in the independent miRNA data set were classified in concordance with their SSP molecular subtype classification.</p>
         </sec>
         <sec>
            <st>
               <p>A number of miRNAs are associated with clinicopathological factors</p>
            </st>
            <p>We next assessed associations between individual miRNAs, molecular tumor subtypes and clinicopathological factors (Figure <figr fid="F3">3</figr> and Additional data file 18). We tested for statistically significant associations with tumor characteristics such as molecular subtype, grade, stage, vascular invasion, ER status, Nottingham Prognostic Index (NPI) as well as TP53 status as determined by mutation screening and HER2 status assessed by immunohistochemistry (unpublished results). Figure <figr fid="F3">3</figr> summarizes data for those 31 miRNAs and clinical factors for which there are significant associations at an adjusted <it>p </it>value less than 0.01 (Materials and methods). These 31 miRNAs represent 20 distinct miRNA families. Most of these miRNAs are expressed in the less aggressive, grade 1, ER+ samples. However, some miRNAs are expressed in the more aggressive grade 3/ER- tumors. We did not find any strong associations with stage, vascular invasion, NPI, TP53 or HER2 status.</p>
            <fig id="F3">
               <title>
                  <p>Figure 3</p>
               </title>
               <caption>
                  <p>Association of individual miRNAs and tumor subtype or clinicopathological factors</p>
               </caption>
               <text>
                  <p>Association of individual miRNAs and tumor subtype or clinicopathological factors. Shown are 31 miRNAs and three factors with at least one association at adjusted <it>p </it>&lt; 0.01. Differential expression was assessed by a non-parametric Wilcoxon rank sum test for comparison between two groups or a non-parametric Kruskal-Wallis test for comparison between multiple groups. To address the issue of multiple testing for the same factor, <it>p </it>values were adjusted by Benjamini and Hochberg's method [102]. Heatmap colors represent relative miRNA expression as shown in the color key. The expression values for a given sample group of interest were summarized by their mean. Brackets in the left margin indicate members of the same miRNA family. Significance levels are shown in the right margins: * adjusted <it>p </it>&lt; 0.05; ** adjusted <it>p </it>&lt; 0.01; *** adjusted <it>p </it>&lt; 0.001. Abbreviations for subtype: B, basal-like; H, HER2+; LA, luminal A; LB, luminal B; N, normal-like.</p>
               </text>
               <graphic file="gb-2007-8-10-r214-3"/>
            </fig>
         </sec>
         <sec>
            <st>
               <p>Chromosomal loss or gain cannot explain the majority of changes in miRNA expression</p>
            </st>
            <p>Given the changes in miRNA expression we observed, it is important to ask how these changes come about. We first tested if the changes in miRNA expression are likely due to chromosomal loss, gain or amplification as inferred from array comparative genomic hybridization (CGH) data. For 82 of the 93 tumor samples we analyzed for miRNA expression, we performed array CGH analysis based on gene centric oligonucleotide microarrays <abbrgrp><abbr bid="B86">86</abbr><abbr bid="B87">87</abbr></abbrgrp>. For each miRNA locus that was identified as altered in any of the samples, we performed separate non-parametric Wilcoxon rank sum tests to assess differences in expression between samples with loss, gain or amplification compared to samples without changes.</p>
            <p>We found that in many cases expression differences could not be explained by any genome alterations detected by our array CGH data (Figure <figr fid="F4">4</figr>). The expression of 17 out of 129 mature miRNAs transcribed from genomic regions with an observed aberration correlated with genomic changes at 15 distinct chromosomal loci (<it>p </it>&lt; 0.01). For miR-33 and miR-320, we found strong associations between miRNA expression and genomic alterations (<it>p </it>&lt; 0.001), suggesting chromosomal change is a possible mechanism for mis-expression of these genes in primary human breast cancers. We also identified miRNA clusters whose changes in expression were correlated with copy number, for example, for miR-30b and miR-30d at C8q24.22 (<it>p </it>&lt; 0.001) and miR-15b and miR-16-2 at C3q26.1 (<it>p </it>&lt; 0.05).</p>
            <fig id="F4">
               <title>
                  <p>Figure 4</p>
               </title>
               <caption>
                  <p>Association of miRNA expression and DNA copy number</p>
               </caption>
               <text>
                  <p>Association of miRNA expression and DNA copy number. miRNAs mapping to regions of genomic aberration were plotted according to chromosome and genomic location. Heatmap colors represent relative miRNA expression as shown in the color key. Expression values for samples with genomic loss (L), unaltered samples (N), samples with genomic gain (G) and amplification (A) were summarized by their mean, respectively, with numbers of samples as indicated. miRNAs transcribed from multiple loci are indicated in blue. Adjacent miRNAs not separated by a black line are less than 50 kb apart. Significance levels correspond to unadjusted <it>p </it>values obtained by a non-parametric Wilcoxon rank sum test (* <it>p </it>&lt; 0.05, ** <it>p </it>&lt; 0.01, *** <it>p </it>&lt; 0.001). Given the high dependence of the performed tests, <it>p </it>values were not adjusted for multiple testing.</p>
               </text>
               <graphic file="gb-2007-8-10-r214-4"/>
            </fig>
         </sec>
         <sec>
            <st>
               <p>Expression of clustered miRNAs is coordinated</p>
            </st>
            <p>We noticed that miRNA clusters are often expressed coordinately in our sample set. For example, miR-106b, miR-93 and miR-25 situated on C7q22.1 are highly expressed in high-grade tumors. To further examine this phenomenon, we calculated the pairwise Pearson correlation of expression between miRNAs on the same chromosome and strand. We observed an abrupt drop in correlation of miRNA expression for pairs of miRNAs that were more than 50 kb apart (Additional data file 12). These observations agree well with what has been observed earlier in human tissue samples <abbrgrp><abbr bid="B88">88</abbr></abbrgrp>. We therefore used a distance of 50 kb as a cut-off to identify 56 intergenic or gene-resident spatial clusters, 44 of which are represented in the set of 137 miRNAs detected in our sample set. Interestingly, 26 of 31 clusters for which expression data from multiple stem-loop regions were available show correlated expression with r > 0.4 (Figure <figr fid="F5">5</figr> and Additional data file 13). For example, the miR-15 and miR-16 family are expressed from two clusters at chromosomes 3q and 13q, which are both highly correlated (r > 0.8). In many cases these correlations are likely due to shared regulatory elements or polycistronic expression of several miRNAs from a single primary transcript <abbrgrp><abbr bid="B88">88</abbr></abbrgrp>.</p>
            <fig id="F5">
               <title>
                  <p>Figure 5</p>
               </title>
               <caption>
                  <p>Expression of clustered miRNAs is coordinated</p>
               </caption>
               <text>
                  <p>Expression of clustered miRNAs is coordinated. Shown are pairwise scatter plots of expression values for mature miRNAs transcribed from genomic regions within 50 kb of each other. <b>(a) </b>miR-15a, miR-15b and miR-16 transcribed from two intronic clusters at C3q26.1 (<it>SMC4L1</it>) and C13q14.3 (<it>DLEU2</it>). <b>(b) </b>miR-25, miR-93 and miR-106b transcribed from an intronic cluster at C7q22.1 (<it>MCM7</it>). <b>(c) </b>miR-199a, miR-199a*, miR-199b and miR-214 transcribed from one intergenic cluster at C1q24.3 and two intergenic stem-loops at C9q34.11 and C19p13.2. Pearson correlation coefficients (r) and data points shown are based on samples with available array CGH data and no identified genomic loss or gain at the relevant locus (Additional data file 1). Genome plots are drawn to scale as shown in the legend (bottom right), except where missing regions are indicated by vertical bars. Positive and negative strands are depicted by the top and bottom plots, respectively. Gene loci and miRNA stem-loop regions are colored in blue and red, respectively. The location of exons is marked by greater line width.</p>
               </text>
               <graphic file="gb-2007-8-10-r214-5"/>
            </fig>
         </sec>
         <sec>
            <st>
               <p>A number of miRNA genes are co-regulated as part of larger domains</p>
            </st>
            <p>Since only 17 of the 137 miRNAs expressed in our samples showed changes in their expression associated with detected chromosomal abnormalities, changes in miRNA expression may be due to changes in transcription of primary miRNA transcripts. We showed above that miRNA clusters are expressed coordinately. We therefore asked if expression levels of miRNAs that are intronic are correlated with the expression of their host gene, as this suggests changes in primary transcription rates. To test this hypothesis, we compared miRNA expression data with Illumina mRNA expression data for our tumor sample set (unpublished results; Additional data file 13). We only detected correlations for seven miRNA host gene pairs (r > 0.4), suggesting that changes in miRNA expression in our tumor sample set are not generally linked to host gene expression (Table <tblr tid="T1">1</tblr>). These seven miRNA host gene pairs were miR-30e-5p/<it>NFYC</it>, miR-149/<it>GPC1</it>, miR-25/93/106b/<it>MCM7</it>, miR-342/<it>EVL </it>and miR-99a/<it>C21orf34</it>.</p>
            <tbl id="T1">
               <title>
                  <p>Table 1</p>
               </title>
               <caption>
                  <p>MicroRNA/proximal probe correlations</p>
               </caption>
               <tblbdy cols="7">
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c cspan="2" ca="center">
                        <p>Host gene</p>
                     </c>
                     <c cspan="3" ca="center">
                        <p>Proximal probe</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c cspan="2">
                        <hr/>
                     </c>
                     <c cspan="3">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>miRNA</p>
                     </c>
                     <c ca="left">
                        <p>Chromosome position</p>
                     </c>
                     <c ca="left">
                        <p>Name</p>
                     </c>
                     <c ca="right">
                        <p>Pearson correlation</p>
                     </c>
                     <c ca="left">
                        <p>Name<sup>&#8224;</sup></p>
                     </c>
                     <c ca="right">
                        <p>Pearson correlation</p>
                     </c>
                     <c ca="right">
                        <p>miRNA/probe distance (kb)</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="7">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>miR-101</p>
                     </c>
                     <c ca="left">
                        <p>1p31.1</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>
                           <it>FLJ26232</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>0.4337</p>
                     </c>
                     <c ca="right">
                        <p>35.99</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>miR-30e-5p</p>
                     </c>
                     <c ca="left">
                        <p>1p34.2</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>NFYC</it>
                        </p>
                     </c>
                     <c ca="left">
                        <p>0.4950</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="right">
                        <p>17.02</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>miR-181a</p>
                     </c>
                     <c ca="left">
                        <p>1q31.3</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>Hs.497310</p>
                     </c>
                     <c ca="center">
                        <p>0.4106</p>
                     </c>
                     <c ca="right">
                        <p>19.61</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>miR-205</p>
                     </c>
                     <c ca="left">
                        <p>1q32.2</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>
                           <it>NPC-A-5</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>0.7936</p>
                     </c>
                     <c ca="right">
                        <p>0.00</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>miR-10b</p>
                     </c>
                     <c ca="left">
                        <p>2q31.1</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>
                           <it>HOXD10</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>0.4902</p>
                     </c>
                     <c ca="right">
                        <p>30.96</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>
                           <it>HOXD8</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>0.4472</p>
                     </c>
                     <c ca="right">
                        <p>18.53</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>miR-149</p>
                     </c>
                     <c ca="left">
                        <p>2q37.3</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>GPC1</it>
                        </p>
                     </c>
                     <c ca="left">
                        <p>0.6567</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="right">
                        <p>11.68</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>miR-30a-3p</p>
                     </c>
                     <c ca="left">
                        <p>6q13</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>
                           <it>BC040204</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>0.6406</p>
                     </c>
                     <c ca="right">
                        <p>16.17</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>miR-30a-5p</p>
                     </c>
                     <c ca="left">
                        <p>6q13</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>
                           <it>BC040204</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>0.7091</p>
                     </c>
                     <c ca="right">
                        <p>16.17</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>
                           <it>C6orf155</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>0.4995</p>
                     </c>
                     <c ca="right">
                        <p>11.12</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>miR-30c</p>
                     </c>
                     <c ca="left">
                        <p>6q13</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>
                           <it>BC040204</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>0.4566</p>
                     </c>
                     <c ca="right">
                        <p>10.30</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>miR-106b</p>
                     </c>
                     <c ca="left">
                        <p>7q22.1</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>MCM7</it>
                        </p>
                     </c>
                     <c ca="left">
                        <p>0.5157</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="right">
                        <p>1.02</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>miR-25</p>
                     </c>
                     <c ca="left">
                        <p>7q22.1</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>MCM7</it>
                        </p>
                     </c>
                     <c ca="left">
                        <p>0.4939</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="right">
                        <p>0.59</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>miR-93</p>
                     </c>
                     <c ca="left">
                        <p>7q22.1</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>MCM7</it>
                        </p>
                     </c>
                     <c ca="left">
                        <p>0.4988</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="right">
                        <p>0.79</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>miR-181a</p>
                     </c>
                     <c ca="left">
                        <p>9q33.3</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>NR6A1</it>
                           <sup>&#8225;</sup>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>
                           <it>R08260</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>0.5913</p>
                     </c>
                     <c ca="right">
                        <p>1.51</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>miR-181b</p>
                     </c>
                     <c ca="left">
                        <p>9q33.3</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>NR6A1</it>
                           <sup>&#8225;</sup>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>
                           <it>R08260</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>0.5634</p>
                     </c>
                     <c ca="right">
                        <p>2.78</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>miR-196a</p>
                     </c>
                     <c ca="left">
                        <p>12q13.13</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>
                           <it>HOXC10</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>0.4914</p>
                     </c>
                     <c ca="right">
                        <p>1.75</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>miR-342</p>
                     </c>
                     <c ca="left">
                        <p>14q32.2</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>EVL</it>
                        </p>
                     </c>
                     <c ca="left">
                        <p>0.7208</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="right">
                        <p>34.26</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>miR-10a</p>
                     </c>
                     <c ca="left">
                        <p>17q21.32</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>GI_30159691</p>
                     </c>
                     <c ca="center">
                        <p>0.8123</p>
                     </c>
                     <c ca="right">
                        <p>0.40</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>
                           <it>HOXB6</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>0.8085</p>
                     </c>
                     <c ca="right">
                        <p>16.10</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>
                           <it>HOXB5</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>0.7150</p>
                     </c>
                     <c ca="right">
                        <p>11.48</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>
                           <it>HOXB3</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>0.6908</p>
                     </c>
                     <c ca="right">
                        <p>29.79</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>
                           <it>HOXB2</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>0.7019</p>
                     </c>
                     <c ca="right">
                        <p>36.74</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>
                           <it>HOXB4</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>0.6856</p>
                     </c>
                     <c ca="right">
                        <p>2.90</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>
                           <it>HOXB8</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>0.5937</p>
                     </c>
                     <c ca="right">
                        <p>32.43</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>miR-199a*</p>
                     </c>
                     <c ca="left">
                        <p>19p13.2</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>DNM2</it>
                           <sup>&#8225;</sup>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>
                           <it>TMED1</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>0.4111</p>
                     </c>
                     <c ca="right">
                        <p>15.22</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>miR-99a</p>
                     </c>
                     <c ca="left">
                        <p>21q21.1</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>C21orf34</it>
                        </p>
                     </c>
                     <c ca="left">
                        <p>0.4766</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="right">
                        <p>67.87</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>miR-155</p>
                     </c>
                     <c ca="left">
                        <p>21q21.3</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>
                           <it>BIC</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>0.4688</p>
                     </c>
                     <c ca="right">
                        <p>0.73</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <it>let-7a</it>
                        </p>
                     </c>
                     <c ca="left">
                        <p>22q13.31</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>
                           <it>FLJ27365</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>0.5272</p>
                     </c>
                     <c ca="right">
                        <p>1.45</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <it>let-7b</it>
                        </p>
                     </c>
                     <c ca="left">
                        <p>22q13.31</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>
                           <it>FLJ27365</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>0.5732</p>
                     </c>
                     <c ca="right">
                        <p>2.38</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p><sup>&#8224;</sup>Gene symbol, accession number or Illumina probe identifier. <sup>&#8225;</sup>Gene lies on the opposite strand.</p>
               </tblfn>
            </tbl>
            <p>For miRNA genes that are intergenic, we performed a similar comparison using the most proximal probes (within 50 kb) from the Illumina platform as these probes might correspond to primary miRNA transcripts (Additional data file 13). Only 23 out of 243 miRNA/proximal probe pairs at 11 distinct loci correlated in expression (r > 0.4; Table <tblr tid="T1">1</tblr>). Some of these miRNAs have proximal probes that are very close and likely represent primary miRNA transcripts. For example, miR-205 expression is highly correlated with the proximal probe for transcript <it>NPC-A-5 </it>(r > 0.75). One striking example of correlated expression of miRNAs and proximal probes was miR-10a, which is part of the <it>HOXB </it>cluster (C17q21.32), where Illumina probe data suggest the co-regulation of a region from <it>HOXB2 </it>to <it>HOXB6 </it>including miR-10a (Table <tblr tid="T1">1</tblr>).</p>
         </sec>
         <sec>
            <st>
               <p>Some changes in miRNA expression may be due to changes in miRNA biosynthesis</p>
            </st>
            <p>As genomic changes and transcriptional regulation of miRNA expression do not explain the changes in miRNA expression we observed in human breast cancers, post-transcriptional regulation of miRNA expression has to be considered. Indeed, recent studies suggested that primary miRNA processing might be deregulated in human cancer <abbrgrp><abbr bid="B64">64</abbr><abbr bid="B89">89</abbr><abbr bid="B90">90</abbr></abbrgrp>. Therefore, we tested whether genes required for miRNA biogenesis are differentially expressed in our breast cancer samples. As we found many changes in miRNA expression across the five clinical tumor subtypes we had defined above (Figure <figr fid="F2">2</figr>), we asked whether <it>DICER1</it>, <it>DROSHA</it>, <it>DGCR8</it>, <it>AGO1</it>, <it>AGO2</it>, <it>AGO3 </it>or <it>AGO4 </it>expression differs among these subgroups. We found significant changes in the expression of <it>DICER1 </it>(<it>p </it>&lt; 0.001), which was low in the more aggressive basal-like, HER2+ and luminal B type tumors, and <it>AGO2</it>, which was high in basal-like, HER2+ and luminal B type tumors (Figure <figr fid="F6">6</figr>). We did not find significant changes in the expression of <it>DROSHA</it>, <it>DGCR8</it>, or any of the other <it>AGO </it>genes (Figure <figr fid="F6">6</figr> and Additional data file 10). We also observed significant changes in <it>AGO2</it>, <it>DICER1 </it>and <it>DROSHA </it>expression in relation to ER status, with <it>AGO2 </it>and <it>DROSHA </it>being higher and <it>DICER1 </it>lower in ER- tumor samples (Figure <figr fid="F6">6</figr>).</p>
            <fig id="F6">
               <title>
                  <p>Figure 6</p>
               </title>
               <caption>
                  <p>Genes required for miRNA biogenesis are differentially expressed according to molecular subtype and ER status</p>
               </caption>
               <text>
                  <p>Genes required for miRNA biogenesis are differentially expressed according to molecular subtype and ER status. Shown are boxplots of Illumina log<sub>2 </sub>intensities for <b>(a) </b><it>AGO2 </it>(<it>EIF2C2</it>), <b>(b) </b><it>DICER1</it>, <b>(c) </b><it>DROSHA </it>(<it>RNASEN</it>). Data are based on 58 samples that could be classified according to molecular subtype (17 basal-like (red), 5 HER2+ (pink), 18 luminal A (dark blue), 8 luminal B (light blue), 10 normal-like (green)) and 99 samples with known ER status (31 ER- (blue), 68 ER+ (yellow)). <b>(d) </b>Boxplots of mean miRNA expression after control-based normalization. Data are based on 51 samples that could be classified according to molecular subtype (16 basal-like (red), 5 HER2+ (pink), 15 luminal A (dark blue), 9 luminal B (light blue), 6 normal-like (green)) and 93 samples with known ER status (33 ER- (blue), 60 ER+ (yellow)). Black bars indicate the median; boxes interquartile range; whiskers most extreme data points not exceeding 1.5 times the interquartile range; points outliers. <it>P </it>values are based on non-parametric Kruskal-Wallis tests for subtype and Wilcoxon rank sum tests for ER status.</p>
               </text>
               <graphic file="gb-2007-8-10-r214-6"/>
            </fig>
            <p>The observed deregulation of genes required for miRNA biogenesis may be expected to lead to global changes in miRNA expression. To further investigate this possibility, we utilized an alternative approach to between-sample normalization. For the analyses described previously, sample median centering proved advantageous in removing technical variation between samples without changing trends in differential expression (Additional data files 1 and 4). However, this method necessarily removed any global changes in miRNA expression. Using an alternative normalization based on spike-in controls, similar to the method described in <abbrgrp><abbr bid="B56">56</abbr></abbrgrp>, we detected small differences in mean miRNA levels according to ER status with lower mean miRNA expression in ER- tumors (Figure <figr fid="F6">6d</figr>).</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Discussion</p>
         </st>
         <p>Using an innovative bead-based miRNA expression profiling method we have determined the expression profile for 309 miRNAs in primary human breast cancer. We found that miRNA expression classified molecular tumor subtypes. Furthermore, a number of individual miRNAs were associated with clinicopathological factors. Changes in miRNA expression were complex and were likely due to genomic loss or gain, transcriptional and post-transcriptional regulation and changes in the expression of miRNA biogenesis enzymes. This study forms the basis for developing miRNA expression signatures as diagnostic tools for breast cancer and also furthers our understanding of the role of miRNAs in tumorigenesis.</p>
         <p>Two previous studies of miRNA expression in human breast cancer have focused on comparing normal tissues to tumor samples. Here we focused on miRNA expression analysis of a large set of primary human tumors to reveal signatures of tumor subtype. Nevertheless, we also identified 7 out of 24 miRNAs that had previously been associated with breast cancers compared to normal tissues <abbrgrp><abbr bid="B78">78</abbr></abbrgrp> (Additional data file 18). In addition, we can confirm three of 26 miRNAs that were reported in a separate study <abbrgrp><abbr bid="B77">77</abbr></abbrgrp>. Notably, one miRNA, miR-155, is differentially expressed in ER- versus ER+ tumors (Figure <figr fid="F3">3</figr>), overexpressed in breast tumors compared to normal controls <abbrgrp><abbr bid="B77">77</abbr><abbr bid="B78">78</abbr></abbrgrp> and additionally other tumor types, suggesting that this miRNA may have diagnostic potential beyond breast cancer <abbrgrp><abbr bid="B54">54</abbr><abbr bid="B91">91</abbr><abbr bid="B92">92</abbr><abbr bid="B93">93</abbr></abbrgrp>. More recently, a quantitative RT-PCR study of miRNA expression from breast cancer biopsies revealed that miRNA expression classifies ER status <abbrgrp><abbr bid="B79">79</abbr></abbrgrp>, which is in agreement with our observations (Figure <figr fid="F1">1b</figr>). Surprisingly, we found little agreement among miRNAs we identified as being associated with clinicopathological factors and miRNAs identified in this context in a previous study <abbrgrp><abbr bid="B77">77</abbr></abbrgrp>.</p>
         <p>We showed that a large number of miRNAs in our data set are associated with molecular subtypes, and we explored the predictive potential of miRNAs in an independent test set. A model-based discriminant analysis of our training set of 31 basal-like and luminal A samples resulted in the classification of 5 samples from an independent study that was in accordance with gene expression-based molecular subtype classification. Although these results are promising, the test set is too small to allow for a sensible performance assessment of the classifier. However, there are currently no other breast tumor data sets with both mRNA and miRNA expression data publicly available that would allow further validation of miRNA-based molecular subtype classification.</p>
         <p>If miRNA expression profiles classify primary breast tumor subtypes, they may prove useful as diagnostic tools in the future and this could be assessed in a prospective study. Bead-based array miRNA profiling may be particularly well suited to assay miRNA expression in large-scale diagnostic trials since it is a high-throughput and cost-effective method <abbrgrp><abbr bid="B56">56</abbr><abbr bid="B94">94</abbr></abbrgrp>. If miRNAs prove useful for clinical breast cancer diagnosis, they have the additional advantage that, in contrast to most mRNAs, they are long-lived <it>in vivo </it><abbrgrp><abbr bid="B35">35</abbr></abbrgrp> and very stable <it>in vitro </it><abbrgrp><abbr bid="B95">95</abbr></abbrgrp>, which might be critical in a clinical setting and allow analysis of paraffin-embedded samples.</p>
         <p>We found that the differences in miRNA expression we observed are likely not due to genomic loss or gain (Figure <figr fid="F4">4</figr>). Therefore, we investigated the regulation of miRNA expression at the transcriptional and post-transcriptional level (Figure <figr fid="F5">5</figr>, Table <tblr tid="T1">1</tblr>). As previously described for normal human tissues <abbrgrp><abbr bid="B88">88</abbr></abbrgrp>, we found that the majority of miRNA clusters are co-regulated in human breast tumors. These data are also in agreement with similar observations made in human leukemia samples <abbrgrp><abbr bid="B96">96</abbr></abbrgrp> and support the hypothesis that changes in miRNA expression in human cancer may not be distinct from normal tissue-specific miRNA expression in humans. In some instances, miRNA expression also correlates with host gene expression in the case of intronic miRNAs, or with the expression of larger domains, such as the <it>HOXB </it>cluster (Table <tblr tid="T1">1</tblr> and Additional data file 13). In these instances, miRNA expression appears to be mainly under transcriptional control.</p>
         <p>However, in many cases we observe that miRNA expression is not correlated with host genes or primary miRNA transcripts, suggesting post-transcriptional regulation of miRNA expression. Regulation of miRNA expression at the level of <it>DROSHA </it>has previously been proposed for human cancer <abbrgrp><abbr bid="B64">64</abbr><abbr bid="B90">90</abbr></abbrgrp>. We found that <it>DICER1 </it>expression is significantly downregulated in the more aggressive basal-like, HER2+ and luminal B type tumors. Interestingly, a recent study showed that downregulating <it>DICER1 </it>expression promotes tumorgenesis <it>in vitro </it>and in a mouse lung cancer model <abbrgrp><abbr bid="B97">97</abbr></abbrgrp>. Together, these data suggest that <it>DICER1 </it>deregulation might be involved in the etiology of human breast cancer. In addition, we find that the deregulation of genes in the miRNA biogenesis pathway that we observed is in agreement with a number of independent data sets <abbrgrp><abbr bid="B98">98</abbr></abbrgrp> (Additional data file 11).</p>
         <p>Although both mRNA and miRNA expression profiles were found to be informative with regard to tumor subtype, their functional relationship remains unclear. In particular, we were interested to discover if changes in miRNA expression may correlate with changes in mRNA levels of direct targets (Additional data file 1). We considered miRNA families with identical seed (nucleotides 2-7) and mRNAs with conserved seed complementarity in their 3'UTR (Targetscan 3.1) <abbrgrp><abbr bid="B38">38</abbr></abbrgrp>. A number of miRNA families showed differential expression between subtypes for their mean expression profile. We could detect only a few instances of enrichment for down- or up-regulation of predicted target mRNAs consistent with changes in miRNA expression, although previous studies of normal human tissue did observe such an enrichment <abbrgrp><abbr bid="B45">45</abbr><abbr bid="B99">99</abbr></abbrgrp>. However, these data are consistent with the hypothesis that many miRNAs act at the level of translation rather than mRNA stability.</p>
      </sec>
      <sec>
         <st>
            <p>Conclusion</p>
         </st>
         <p>To date, many studies of miRNA expression in human cancer have focused only on the deregulation of miRNA expression. Here we integrated the analysis of miRNA expression, mRNA expression and DNA copy number in human breast cancer. Based on a combined analysis of miRNA and mRNA expression data we have identified a number of miRNAs that are differentially expressed between molecular tumor subtypes. In addition, we identified candidate miRNAs that are regulated at the genomic, transcriptional and likely post-transcriptional levels in breast cancer using miRNA, mRNA and array CGH data. Using mRNA expression data, we also found that the expression of genes in the miRNA biogenesis pathway is deregulated in breast cancer. We suggest that further analysis of integrated data sets might help to unravel miRNA-dependent pathways in human breast cancer.</p>
      </sec>
      <sec>
         <st>
            <p>Materials and methods</p>
         </st>
         <sec>
            <st>
               <p>Sample collection</p>
            </st>
            <p>Primary breast tumor specimens were obtained with appropriate ethical approval from the Nottingham Tenovus Primary Breast Cancer Series (Nottingham City Hospital Tumor Bank, Nottingham, UK). All cases were primary operable invasive breast carcinomas collected from 1990 to 1996. Clinical information, including therapy, has been published previously <abbrgrp><abbr bid="B80">80</abbr><abbr bid="B81">81</abbr><abbr bid="B82">82</abbr><abbr bid="B83">83</abbr><abbr bid="B87">87</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>RNA extraction and labeling</p>
            </st>
            <p>RNA was extracted from primary tumors and cell lines using a standard Trizol (Invitrogen, Carlsbad, CA, USA) protocol, modified by washing the final RNA pellet with 80% EtOH. Frozen tumors were sectioned on a cryostat prior to homogenization in Trizol. RNA quantity and quality were assessed by Nanodrop (Nanodrop Technologies, Wilmington, DE, USA) and Agilent 2100 bioanalyzer (Agilent Technologies, Santa Clara, CA, USA), respectively.</p>
            <p>miRNAs were extracted from 5 &#956;g of sample total RNA using denaturing PAGE. Briefly, samples were spiked with three synthetic pre-labeling control RNAs (5'<b>-</b>pCAGUCAGUCAGUCAGUCAGUCAG-3', 5'-pGACCUCCAUGUAAACGUACAA-3', 5'-pUUGCAGAUAACUGGUACAAG-3'; Dharmacon, Lafayette, CO, USA) to control for target preparation efficiency, at 3 fmoles/sample. After purification of 18-26 bp RNAs, adaptors were ligated at the 3' and 5' ends using T4 RNA ligase (Fermentas, Burlington, OT, CA), a RNA-DNA hybrid 5'-pUUUaaccgcgaattccagt-idT-3' (Dharmacon; X = RNA, x = DNA, p = phosphate, idT = inverted [3'-3' bond] deoxythymidine) was ligated to the 3' end and 5'-acggaattcctcactAAA-3' (Dharmacon) was ligated to the 5' end using T4 RNA ligase. These bi-ligated products underwent reverse transcription using an adaptor specific primer (M37, 5'-pTACTGGAATTCGCGGTTA-3') and then amplified and labeled using PCR (M37 and M33, 5'-biotin-CAACGGAATTCCTCACTAAA-3'). Amplification was performed on an Eppendorf thermal cycler at 95&#176;C for 30 s, 50&#176;C for 30 s and 72&#176;C for 40 s for 18 cycles. PCR products were precipitated without glycogen and redissolved in 66 &#956;l 1 &#215; TE buffer containing 1 &#956;l of three biotinylated post labeling controls (100 fmols each, FVR506, PTG20210, MRC677).</p>
         </sec>
         <sec>
            <st>
               <p>Bead coupling and hybridization</p>
            </st>
            <p>Oligonucleotide probes were coupled to color-coded polystyrene beads, allowing the simultaneous detection of about 90 different target oligonucleotides. To obtain expression profiles for 309 miRNAs, we created four distinct sets of bead-coupled miRNA probes. Each sample was hybridized to the four bead sets to generate a complete miRNA profile. Oligos were 5'-amino modified with a 6-carbon linker and conjugated to carboxylated xMAP beads (Luminex, Austin, TX, USA) in 96-well formats following the standard manufacturer's protocol. To generate bead set pools, 3 &#956;l of each oligo-bead conjugate was mixed into 1 ml 1.5&#215; TMAC buffer (4.5 M tetramethylammonium chloride, 0.15% sarkosyl, 75 mM Tris-HCl pH 8.0, 6 mM EDTA). Samples were hybridized in a 96-well format with two water-only blanks and at least three bead blanks containing water instead of the labeled sample for use as a background control. We included replicate probes and technical replicate samples across bead sets and sample plates, respectively, to aid quality control and data preprocessing. Hybridization was carried out overnight at 50&#176;C with 33 &#956;l of the bead pool and 15 &#956;l of labeled sample.</p>
            <p>Unbound sample was removed from beads by washing with 1 &#215; TE and re-suspending in 1&#215; TMAC buffer. SAPE, streptavidin-phycoerythrin, premium grade (Invitrogen) was added to the beads (1:100 dilution) and incubated for 10 minutes at 50&#176;C to bind to biotin moieties on the cDNA. Samples were processed on a Luminex 100 machine and median fluorescence intensity values acquired using the StarStation software (ACS, Sheffield, UK).</p>
         </sec>
         <sec>
            <st>
               <p>Computational analysis</p>
            </st>
            <sec>
               <st>
                  <p>Preprocessing</p>
               </st>
               <p>Median fluorescence intensity values smaller than a threshold of 1 were set equal to 1, and all values were transformed by taking logs (base 2). Samples with low mean expression were excluded from further analyses (Additional data files 1 and 3). To reduce noise due to absent probes, each probe was required to exceed a log<sub>2 </sub>median fluorescence intensity value of 6 in at least one sample. Systematic probe effects were median-corrected (Additional data files 1 and 2). Replicate probes were summarized by their mean profile and samples were centered to have zero median. Technical replicate samples were summarized by their mean profile. For a more detailed description of preprocessing please see Additional data file 1.</p>
            </sec>
            <sec>
               <st>
                  <p>Genomic annotation</p>
               </st>
               <p>miRNA probe sequences were matched against stem-loop sequences in miRBase (release 8.1). Genomic miRNA clusters were identified by requiring any two stem-loops on the same chromosome and strand within 50 kb to belong to the same clusters (Additional data file 16). A miRNA was defined as gene-resident if its stem-loop is completely contained in the locus of a gene transcript on the same chromosomal strand as annotated in the Known Genes and RefSeq Genes tables obtained from the UCSC Genome Browser (hg18) <abbrgrp><abbr bid="B100">100</abbr></abbrgrp> (Additional data file 17).</p>
            </sec>
            <sec>
               <st>
                  <p>Illumina gene expression data</p>
               </st>
               <p>Illumina gene expression data were processed and summarized in the Illumina BeadStudio software. Analyses of the probe level data were performed using the <it>beadarray </it>Bioconductor package <abbrgrp><abbr bid="B101">101</abbr></abbrgrp>. After quality control, between-array qspline normalization was performed for 112 arrays for 99 samples. Replicate arrays were averaged and expression values were transformed by taking logs (base 2).</p>
            </sec>
         </sec>
         <sec>
            <st>
               <p>Subtype classification</p>
            </st>
            <p>Each array in the preprocessed Illumina and Agilent <abbrgrp><abbr bid="B83">83</abbr></abbrgrp> gene expression data set was normalized to have zero mean and standard deviation one, and each probe was centered to have zero median. An SSP annotation for Agilent probes was provided in <abbrgrp><abbr bid="B76">76</abbr></abbrgrp>. Detailed information on the SSP annotation for Illumina probes can be found in Additional data files 1 and 15. Multiple probes for the same UniGene cluster ID in either data set were summarized by their median profile. Samples were then assigned to the nearest subtype centroid as determined by Spearman correlation, requiring a minimum correlation of 0.3. Samples that could be assigned to subtypes based on both Agilent and Illumina expression profiles were classified according to the Illumina assignment (Additional data file 1).</p>
            <sec>
               <st>
                  <p>Hierarchical clustering</p>
               </st>
               <p>Prior to hierarchical clustering, miRNA profiles were standardized to have mean zero and standard deviation one. Clustering was performed with average linkage and Pearson correlation.</p>
            </sec>
            <sec>
               <st>
                  <p>Supervised analyses</p>
               </st>
               <p>Differential expression was assessed by a non-parametric Wilcoxon rank sum test for comparison between two groups or a non-parametric Kruskal-Wallis test for comparison between multiple groups. To address the issue of multiple testing for the same contrast, adjusted <it>p </it>values were obtained by Benjamini and Hochberg's method <abbrgrp><abbr bid="B102">102</abbr></abbrgrp>.</p>
               <p>
                  <b>Copy-number-driven expression</b>
               </p>
               <p>For each miRNA stem-loop identified as gained, lost or amplified in any of the samples, separate non-parametric Wilcoxon rank sum tests were performed to assess differences in expression between samples with genomic changes and unaltered samples <abbrgrp><abbr bid="B103">103</abbr></abbrgrp>. <it>P </it>values were not adjusted for multiple testing due to the high level of dependence between the performed tests.</p>
               <p>
                  <b>Coexpression of proximal miRNAs and Illumina probes</b>
               </p>
               <p>For a given chromosome and strand, pairwise Pearson correlation coefficients were calculated for all miRNA probes and those Illumina probes mapping to a host gene or within 50 kb of a miRNA stem-loop. To account for coexpression caused by DNA copy number changes, correlation coefficients for probe pairs were calculated using only those samples with available array CGH data showing no evidence for aberration at either locus (Additional data file 1).</p>
               <p>All analyses were performed in the statistical programming environment R <abbrgrp><abbr bid="B104">104</abbr></abbrgrp> using customized functions and functions available from Bioconductor <abbrgrp><abbr bid="B105">105</abbr><abbr bid="B106">106</abbr></abbrgrp> and the MCLUST package <abbrgrp><abbr bid="B107">107</abbr></abbrgrp>. All miRNA expression data have been submitted to the Gene Expression Omnibus (GEO) with accession number GSE7842.</p>
            </sec>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Abbreviations</p>
         </st>
         <p>CGH, comparative genomic hybridization; ER, estrogen receptor; miRNA, microRNA; NPI, Nottingham Prognostic Index; SSP, single sample predictor.</p>
      </sec>
      <sec>
         <st>
            <p>Authors' contributions</p>
         </st>
         <p>CB, CC and EAM conceived and designed the study. ARG and IOE provided breast cancer samples and clinical information. CB, IS and SC performed the experiments under the supervision of CC and EAM. The statistical analysis and experimental design were conducted by LDG and supervised by NPT. ST and AET provided statistical advice. MD preprocessed the Illumina gene expression data. NLBM provided the Illumina probe annotation. CB, LDG, NPT, ST, CC and EAM wrote the manuscript.</p>
      </sec>
      <sec>
         <st>
            <p>Additional data files</p>
         </st>
         <p>The following additional data are available with the online version of this paper. A detailed description of the computational analysis carried out is given in additional data file <supplr sid="S1">1</supplr> and a layout of the experimental design is shown in additional data file <supplr sid="S2">2</supplr>. Additional data on miRNA expression analysis can be found in additional data file <supplr sid="S3">3</supplr> (pre-processing), additional data file <supplr sid="S4">4</supplr> (normalization), additional data file <supplr sid="S5">5</supplr> (replicate probes), additional data file <supplr sid="S6">6</supplr> (replicate samples) and additional data file <supplr sid="S7">7</supplr> (qRT-PCR validation). Additional data file <supplr sid="S8">8</supplr> contains a mRNA expression heatmap for 82 classified samples and 75 intrinsic genes, and additional data file <supplr sid="S9">9</supplr> contains a pairwise comparison of Kaplan-Meier survival curves for 74 classified samples with available follow up data. Additional data on differential expression of miRNA processing genes can be found in additional data file <supplr sid="S10">10</supplr> (this data set) and additional data file <supplr sid="S11">11</supplr> (other data sets). Additional data file <supplr sid="S12">12</supplr> shows the correlation of proximal miRNA probes and additional data file <supplr sid="S13">13</supplr> shows correlations between miRNA probes and Illumina probes. Additional data file <supplr sid="S14">14</supplr> shows a model-based discriminant analysis for Basal-like and Luminal A tumors. Additional data file <supplr sid="S15">15</supplr> contains annotation for the intrinsic gene probe set (single sample predictor). Additional data file <supplr sid="S16">16</supplr> lists spatial miRNA clusters, additional data file <supplr sid="S17">17</supplr> lists host gene coordinates of intragenic miRNAs and additional data file <supplr sid="S18">18</supplr> associations between individual miRNAs, molecular tumor subtypes and clinicopathological factors. Additional data file <supplr sid="S19">19</supplr> contains the intrinsic gene probe sets used for the model-based discriminant analysis.</p>
         <suppl id="S1">
            <title>
               <p>Additional data file 1</p>
            </title>
            <caption>
               <p>Supplementary Notes</p>
            </caption>
            <text>
               <p>This file contains a detailed description of the computational analyis.</p>
            </text>
            <file name="gb-2007-8-10-r214-S1.pdf">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S2">
            <title>
               <p>Additional data file 2</p>
            </title>
            <caption>
               <p>Layout of the experimental design</p>
            </caption>
            <text>
               <p>A. Data matrix of miRNA expression values (schematic). The 333 rows and 168 columns correspond to probes and samples respectively. Expression values for each sample were obtained from hybridizations to four distinct bead sets (with approximately 90 probes each), carried out in separate wells of 96-well plates. Hybridizations were performed on eight plates, using two plates for each bead set. The allocation of samples between the two plates for a given bead set was kept consistent for all four bead sets. Thus both probes and samples could be ordered according to the plate of origin, partitioning the data matrix into eight blocks corresponding to measurements from distinct plates. Expression values for a representative well on plate 1 for beadset 1 are indicated in grey. B. Heatmap of unnormalized log<sub>2 </sub>MFI values for all miRNA probes and all samples. Probes were median centred prior to plotting. C. Heatmap of differences between the probe median for the randomized samples on a given plate and the probe median for all samples on both plates.</p>
            </text>
            <file name="gb-2007-8-10-r214-S2.pdf">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S3">
            <title>
               <p>Additional data file 3</p>
            </title>
            <caption>
               <p>Preprocessing of miRNA expression data</p>
            </caption>
            <text>
               <p>A. Histograms of log<sub>2 </sub>MFI values obtained from wells containing sample material (white) and blank control wells (blue). B. The number of detected probes after filtering was plotted against a range of cutoff values. Probes were removed (filtered) if they did not exceed the chosen cutoff (red) in at least one sample. C, D. Sample quality control. Pearson correlation coefficients for technical replicate samples were plotted against the smaller of the two sample means for (C) cell line technical replicate samples and (D) normal and tumor technical replicate samples. The cutoff used for quality control is indicated by a vertical line. Colours corresponding to sample status are explained in the colour key. E. Technical sample effects. Pairwise differences between the medians of technical replicate samples were plotted for unnormalized data (black), data normalized based on spike-in controls (blue) and data normalized by sample median centering (red). Dashed lines indicate the maximum difference between the medians of any two samples for unnormalized data (black) and for data normalized using spike-in controls (blue).</p>
            </text>
            <file name="gb-2007-8-10-r214-S3.pdf">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S4">
            <title>
               <p>Additional data file 4</p>
            </title>
            <caption>
               <p>Between-sample normalization</p>
            </caption>
            <text>
               <p>Between-sample normalization. A. Shown are data normalized based on spike-in controls for the same miRNAs and factors as in Figure <figr fid="F3">3</figr> in the main text. B. miRNAs and factors with at least one association at adjusted p &lt; 0.01 based on data normalized using spike-in controls. All miRNAs thus identified were also identified after sample median centering with the exception of miR-152, which was found to be associated with all three factors at p &lt; 0.05 (Additional data file 18). Heatmap colours reflect relative miRNA expression. The expression values for a given sample group of interest were summarized by their mean. Brackets in the left margin indicate members of the same miRNA family. Significance levels are indicated in the right margins: * adjusted p &lt; 0.05, ** adjusted p &lt; 0.01, *** adjusted p &lt; 0.001. Abbreviations for subtype: B = Basal-like, H = HER2+, LA = Luminal A, LB = Luminal B, N = Normal-like.</p>
            </text>
            <file name="gb-2007-8-10-r214-S4.pdf">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S5">
            <title>
               <p>Additional data file 5</p>
            </title>
            <caption>
               <p>Replicate probes</p>
            </caption>
            <text>
               <p>Pairwise scatter plots of replicate probes after sample quality control, probe filtering and within-plate probe correction (none of the replicated probes were removed due to probe filtering). Scatter plots for one failed probe (miR-224-4) are marked in red.</p>
            </text>
            <file name="gb-2007-8-10-r214-S5.pdf">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S6">
            <title>
               <p>Additional data file 6</p>
            </title>
            <caption>
               <p>Technical replicate samples</p>
            </caption>
            <text>
               <p>Pairwise scatter plots of technical replicate samples after sample quality control, probe filtering, within-plate probe correction and summarizing replicate probes.</p>
            </text>
            <file name="gb-2007-8-10-r214-S6.pdf">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S7">
            <title>
               <p>Additional data file 7</p>
            </title>
            <caption>
               <p>qRT-PCR validation</p>
            </caption>
            <text>
               <p>Normalized log<sub>2 </sub>MFI values were plotted against log<sub>2</sub>-transformed and median-corrected measurements obtained by qRT-PCR</p>
            </text>
            <file name="gb-2007-8-10-r214-S7.pdf">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S8">
            <title>
               <p>Additional data file 8</p>
            </title>
            <caption>
               <p>Gene expression heatmap for 82 classified samples and 75 of the 80 intrinsic genes</p>
            </caption>
            <text>
               <p>Expression values are based on Illumina data when available, and Agilent data otherwise. The two data sets were normalized as described. Missing values in the Agilent data are indicated in white. Samples were ordered according to molecular subtype (see colour key). The heatmap does not present a hierarchical clustering but merely illustrates differences in gene expression. A. Luminal/ER+ gene cluster. B. ERBB2 and GRB7-containing cluster. C. Interferon-regulated cluster including STAT1. D. Basal epithelial cluster. E. Proliferation cluster.</p>
            </text>
            <file name="gb-2007-8-10-r214-S8.pdf">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S9">
            <title>
               <p>Additional data file 9</p>
            </title>
            <caption>
               <p>Pairwise comparison of Kaplan-Meier survival curves</p>
            </caption>
            <text>
               <p>Pairwise comparison of Kaplan-Meier survival curves for 74 classified samples with available follow up data (21 Basal-like, 7 HER2+, 25 Luminal A, 10 Luminal B, 11 Normal-like). A non-parametric log rank test was used to assess differences in clinical outcome.</p>
            </text>
            <file name="gb-2007-8-10-r214-S9.pdf">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S10">
            <title>
               <p>Additional data file 10</p>
            </title>
            <caption>
               <p>miRNA processing genes show differential expression according to subtype, and ER status</p>
            </caption>
            <text>
               <p>Shown are boxplots of log<sub>2 </sub>expression for <it>DGCR8</it>, <it>DICER1</it>, <it>DROSHA </it>(<it>RNASEN</it>), <it>AGO1 </it>(<it>EIF2C1</it>), <it>AGO2 </it>(<it>EIF2C2</it>), <it>AGO3 </it>(<it>EIF2C3</it>) and <it>AGO4 </it>(<it>EIF2C4</it>). The data were obtained for 58 samples classified according to subtype (17 Basal-like, 5 HER2+, 18 Luminal A, 8 Luminal B, 10 Normal-like) and 99 samples with known ER status (31 ER-, 68 ER+). We only included Illumina probes not mapping to introns and which could be detected at log<sub>2 </sub>expression 6 in at least one sample. Differential expression was assessed using a non-parametric Kruskal-Wallis test (subtype) and Wilcoxon rank sum test (ER status).</p>
            </text>
            <file name="gb-2007-8-10-r214-S10.pdf">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S11">
            <title>
               <p>Additional data file 11</p>
            </title>
            <caption>
               <p>miRNA processing genes show differential expression according to ER status in publicly available data sets</p>
            </caption>
            <text>
               <p>Shown are boxplots of normalized gene expression units for each candidate gene that showed differential expression (Student's t-test p &lt; 0.001). Data were obtained from the cancer microarray database ONCOMINE <abbrgrp><abbr bid="B98">98</abbr></abbrgrp>, and differential expression was assessed using Student's t-test. Each row of plots corresponds to a unique gene; data obtained from different studies are separated by a solid vertical black line. For each data set the number of ER negative (blue) and ER positive (yellow) samples is included in the lower figure margin. The first authors of the relevant publications are included in the plot title.</p>
            </text>
            <file name="gb-2007-8-10-r214-S11.pdf">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S12">
            <title>
               <p>Additional data file 12</p>
            </title>
            <caption>
               <p>Correlation of proximal miRNAs</p>
            </caption>
            <text>
               <p>Pearson correlation coefficients for mature miRNAs mapping to the same chromosome and strand were plotted against decreasing ranks of pairwise distances. Diamonds represent a moving average over five correlation coefficients. The absolute distance is plotted in blue and indicated on the right y-axis. Distance 50 kb is indicated by a vertical red line.</p>
            </text>
            <file name="gb-2007-8-10-r214-S12.pdf">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S13">
            <title>
               <p>Additional data file 13</p>
            </title>
            <caption>
               <p>Correlation of miRNA and Illumina probes</p>
            </caption>
            <text>
               <p>Heatmap of Pearson correlation coefficients (accounting for DNA copy number changes as described) between miRNA probes and selected Illumina probes on the same chromosome and strand. Blank entries are due to missing DNA copy number information. Probes are arranged in genomic order. Black boxes indicate clusters of adjacent probes less than 50 kb apart. Green boxes indicate clusters of probes mapping to the same host gene. Mature miRNAs included in multiple stem-loops are indicated in blue. Relative genomic probe positions are marked as white bars on the chromosomal plot below each heatmap.</p>
            </text>
            <file name="gb-2007-8-10-r214-S13.pdf">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S14">
            <title>
               <p>Additional data file 14</p>
            </title>
            <caption>
               <p>Model-based discriminant analysis for Basal-like and Luminal A tumors</p>
            </caption>
            <text>
               <p>SSP molecular subtype classification based on the Affymetrix gene expression data for normal breast and breast tumor samples in <abbrgrp><abbr bid="B56">56</abbr><abbr bid="B85">85</abbr></abbrgrp>. Spearman correlations with the five subtype centroids are shown for all 14 samples. The solid horizontal black line indicates the minimum correlation required for subtype assignment. If the minimal correlation with a subtype centroid was achieved, the classification was made using the centroid with highest Spearman correlation. B. Shown are class posterior probabilities for 16 Basal-like and 15 Luminal A tumors in the training set (using all detected 138 miRNAs); and three Basal-like and two Luminal A tumors in the test set (using the 77 detected miRNAs in common with the training set). Red and blue indicate the posterior probability of belonging to the Basal-like and Luminal A subtype respectively. Plotting characters indicate the gene expression based subtype classification with squares and triangles representing Basal-like and Luminal A samples respectively. Samples were assigned to the class with posterior probability greater than 0.5 (solid horizontal black line).</p>
            </text>
            <file name="gb-2007-8-10-r214-S14.pdf">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S15">
            <title>
               <p>Additional data file 15</p>
            </title>
            <caption>
               <p>Intrinsic genes, probe sets (single sample predictor)</p>
            </caption>
            <text>
               <p>Intrinsic genes, probe sets (single sample predictor)</p>
            </text>
            <file name="gb-2007-8-10-r214-S15.txt">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S16">
            <title>
               <p>Additional data file 16</p>
            </title>
            <caption>
               <p>Spatial miRNA clusters</p>
            </caption>
            <text>
               <p>Spatial miRNA clusters</p>
            </text>
            <file name="gb-2007-8-10-r214-S16.txt">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S17">
            <title>
               <p>Additional data file 17</p>
            </title>
            <caption>
               <p>Host gene coordinates of intragenic miRNAs</p>
            </caption>
            <text>
               <p>Host gene coordinates of intragenic miRNAs</p>
            </text>
            <file name="gb-2007-8-10-r214-S17.txt">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S18">
            <title>
               <p>Additional data file 18</p>
            </title>
            <caption>
               <p>Associations between individual miRNAs, molecular tumor subtypes and clinicopathological factors</p>
            </caption>
            <text>
               <p>Associations between individual miRNAs, molecular tumor subtypes and clinicopathological factors</p>
            </text>
            <file name="gb-2007-8-10-r214-S18.txt">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S19">
            <title>
               <p>Additional data file 19</p>
            </title>
            <caption>
               <p>Intrinsic genes, probe sets (model-based discriminant analysis)</p>
            </caption>
            <text>
               <p>Intrinsic genes, probe sets (model-based discriminant analysis)</p>
            </text>
            <file name="gb-2007-8-10-r214-S19.txt">
               <p>Click here for file</p>
            </file>
         </suppl>
      </sec>
   </bdy>
   <bm>
      <ack>
         <sec>
            <st>
               <p>Acknowledgements</p>
            </st>
            <p>This work was funded by grants from Cancer Research UK to CC, ST and EAM. CB was supported by the UK National Translation Cancer Research Network (NTRAC) and LDG was supported by an EPSRC fellowship. ST is a Royal Society-Wolfson Research Merit Award holder. We would like to thank the Tissue Bank, City Hospital, Nottingham, UK for human breast samples. We thank Sarah Hyland for her work on the TP53 mutation screen and John Marioni for useful discussions on the analysis. We would like to thank the reviewers for exceptionally helpful comments on the manuscript.</p>
         </sec>
      </ack>
      <refgrp>
         <bibl id="B1">
            <title>
               <p>Heterochronic mutants of the nematode <it>Caenorhabditis elegans</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Ambros</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Horvitz</snm>
                  <fnm>HR</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>1984</pubdate>
            <volume>226</volume>
            <fpage>409</fpage>
            <lpage>416</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.6494891</pubid>
                  <pubid idtype="pmpid" link="fulltext">6494891</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B2">
            <title>
               <p>The <it>C. elegans </it>heterochronic gene <it>lin-4 </it>encodes small RNAs with antisense complementarity to <it>lin-14</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Lee</snm>
                  <fnm>RC</fnm>
               </au>
               <au>
                  <snm>Feinbaum</snm>
                  <fnm>RL</fnm>
               </au>
               <au>
                  <snm>Ambros</snm>
                  <fnm>V</fnm>
               </au>
            </aug>
            <source>Cell</source>
            <pubdate>1993</pubdate>
            <volume>75</volume>
            <fpage>843</fpage>
            <lpage>854</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/0092-8674(93)90529-Y</pubid>
                  <pubid idtype="pmpid" link="fulltext">8252621</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B3">
            <title>
               <p>Posttranscriptional regulation of the heterochronic gene <it>lin-14 </it>by <it>lin-4 </it>mediates temporal pattern formation in <it>C. elegans</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Wightman</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Ha</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Ruvkun</snm>
                  <fnm>G</fnm>
               </au>
            </aug>
            <source>Cell</source>
            <pubdate>1993</pubdate>
            <volume>75</volume>
            <fpage>855</fpage>
            <lpage>862</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/0092-8674(93)90530-4</pubid>
                  <pubid idtype="pmpid" link="fulltext">8252622</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B4">
            <title>
               <p>The 21-nucleotide <it>let-7 </it>RNA regulates developmental timing in <it>Caenorhabditis elegans</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Reinhart</snm>
                  <fnm>BJ</fnm>
               </au>
               <au>
                  <snm>Slack</snm>
                  <fnm>FJ</fnm>
               </au>
               <au>
                  <snm>Basson</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Pasquinelli</snm>
                  <fnm>AE</fnm>
               </au>
               <au>
                  <snm>Bettinger</snm>
                  <fnm>JC</fnm>
               </au>
               <au>
                  <snm>Rougvie</snm>
                  <fnm>AE</fnm>
               </au>
               <au>
                  <snm>Horvitz</snm>
                  <fnm>HR</fnm>
               </au>
               <au>
                  <snm>Ruvkun</snm>
                  <fnm>G</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2000</pubdate>
            <volume>403</volume>
            <fpage>901</fpage>
            <lpage>906</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/35002607</pubid>
                  <pubid idtype="pmpid" link="fulltext">10706289</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B5">
            <title>
               <p>Mutations that lead to reiterations in the cell lineages of <it>C. elegans</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Chalfie</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Horvitz</snm>
                  <fnm>HR</fnm>
               </au>
               <au>
                  <snm>Sulston</snm>
                  <fnm>JE</fnm>
               </au>
            </aug>
            <source>Cell</source>
            <pubdate>1981</pubdate>
            <volume>24</volume>
            <fpage>59</fpage>
            <lpage>69</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/0092-8674(81)90501-8</pubid>
                  <pubid idtype="pmpid" link="fulltext">7237544</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B6">
            <title>
               <p>MicroRNAs: genomics, biogenesis, mechanism, and function.</p>
            </title>
            <aug>
               <au>
                  <snm>Bartel</snm>
                  <fnm>DP</fnm>
               </au>
            </aug>
            <source>Cell</source>
            <pubdate>2004</pubdate>
            <volume>116</volume>
            <fpage>281</fpage>
            <lpage>297</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0092-8674(04)00045-5</pubid>
                  <pubid idtype="pmpid" link="fulltext">14744438</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B7">
            <title>
               <p>Cloning and characterization of micro-RNAs from moss.</p>
            </title>
            <aug>
               <au>
                  <snm>Arazi</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Talmor-Neiman</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Stav</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Riese</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Huijser</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Baulcombe</snm>
                  <fnm>DC</fnm>
               </au>
            </aug>
            <source>Plant J</source>
            <pubdate>2005</pubdate>
            <volume>43</volume>
            <fpage>837</fpage>
            <lpage>848</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1111/j.1365-313X.2005.02499.x</pubid>
                  <pubid idtype="pmpid" link="fulltext">16146523</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B8">
            <title>
               <p>Antiquity of microRNAs and their targets in land plants.</p>
            </title>
            <aug>
               <au>
                  <snm>Axtell</snm>
                  <fnm>MJ</fnm>
               </au>
               <au>
                  <snm>Bartel</snm>
                  <fnm>DP</fnm>
               </au>
            </aug>
            <source>Plant Cell</source>
            <pubdate>2005</pubdate>
            <volume>17</volume>
            <fpage>1658</fpage>
            <lpage>1673</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1143068</pubid>
                  <pubid idtype="pmpid" link="fulltext">15849273</pubid>
                  <pubid idtype="doi">10.1105/tpc.105.032185</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B9">
            <title>
               <p>Identification of novel genes coding for small expressed RNAs.</p>
            </title>
            <aug>
               <au>
                  <snm>Lagos-Quintana</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Rauhut</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Lendeckel</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Tuschl</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2001</pubdate>
            <volume>294</volume>
            <fpage>853</fpage>
            <lpage>858</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.1064921</pubid>
                  <pubid idtype="pmpid" link="fulltext">11679670</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B10">
            <title>
               <p>An abundant class of tiny RNAs with probable regulatory roles in <it>Caenorhabditis elegans</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Lau</snm>
                  <fnm>NC</fnm>
               </au>
               <au>
                  <snm>Lim</snm>
                  <fnm>LP</fnm>
               </au>
               <au>
                  <snm>Weinstein</snm>
                  <fnm>EG</fnm>
               </au>
               <au>
                  <snm>Bartel</snm>
                  <fnm>DP</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2001</pubdate>
            <volume>294</volume>
            <fpage>858</fpage>
            <lpage>862</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.1065062</pubid>
                  <pubid idtype="pmpid" link="fulltext">11679671</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B11">
            <title>
               <p>An extensive class of small RNAs in <it>Caenorhabditis elegans</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Lee</snm>
                  <fnm>RC</fnm>
               </au>
               <au>
                  <snm>Ambros</snm>
                  <fnm>V</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2001</pubdate>
            <volume>294</volume>
            <fpage>862</fpage>
            <lpage>864</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.1065329</pubid>
                  <pubid idtype="pmpid" link="fulltext">11679672</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B12">
            <title>
               <p>Vertebrate microRNA genes.</p>
            </title>
            <aug>
               <au>
                  <snm>Lim</snm>
                  <fnm>LP</fnm>
               </au>
               <au>
                  <snm>Glasner</snm>
                  <fnm>ME</fnm>
               </au>
               <au>
                  <snm>Yekta</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Burge</snm>
                  <fnm>CB</fnm>
               </au>
               <au>
                  <snm>Bartel</snm>
                  <fnm>DP</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2003</pubdate>
            <volume>299</volume>
            <fpage>1540</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.1080372</pubid>
                  <pubid idtype="pmpid" link="fulltext">12624257</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B13">
            <title>
               <p>Endogenous and silencing-associated small RNAs in plants.</p>
            </title>
            <aug>
               <au>
                  <snm>Llave</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Kasschau</snm>
                  <fnm>KD</fnm>
               </au>
               <au>
                  <snm>Rector</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Carrington</snm>
                  <fnm>JC</fnm>
               </au>
            </aug>
            <source>Plant Cell</source>
            <pubdate>2002</pubdate>
            <volume>14</volume>
            <fpage>1605</fpage>
            <lpage>1619</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">150710</pubid>
                  <pubid idtype="pmpid" link="fulltext">12119378</pubid>
                  <pubid idtype="doi">10.1105/tpc.003210</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B14">
            <title>
               <p>MicroRNAs in plants.</p>
            </title>
            <aug>
               <au>
                  <snm>Reinhart</snm>
                  <fnm>BJ</fnm>
               </au>
               <au>
                  <snm>Weinstein</snm>
                  <fnm>EG</fnm>
               </au>
               <au>
                  <snm>Rhoades</snm>
                  <fnm>MW</fnm>
               </au>
               <au>
                  <snm>Bartel</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Bartel</snm>
                  <fnm>DP</fnm>
               </au>
            </aug>
            <source>Genes Dev</source>
            <pubdate>2002</pubdate>
            <volume>16</volume>
            <fpage>1616</fpage>
            <lpage>1626</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">186362</pubid>
                  <pubid idtype="pmpid" link="fulltext">12101121</pubid>
                  <pubid idtype="doi">10.1101/gad.1004402</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B15">
            <title>
               <p>Stage-specific expression of microRNAs during Xenopus development.</p>
            </title>
            <aug>
               <au>
                  <snm>Watanabe</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Takeda</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Mise</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Okuno</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Suzuki</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Minami</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Imai</snm>
                  <fnm>H</fnm>
               </au>
            </aug>
            <source>FEBS Lett</source>
            <pubdate>2005</pubdate>
            <volume>579</volume>
            <fpage>318</fpage>
            <lpage>324</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.febslet.2004.11.067</pubid>
                  <pubid idtype="pmpid" link="fulltext">15642338</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B16">
            <title>
               <p>Identification of virus-encoded microRNAs.</p>
            </title>
            <aug>
               <au>
                  <snm>Pfeffer</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Zavolan</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Grasser</snm>
                  <fnm>FA</fnm>
               </au>
               <au>
                  <snm>Chien</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Russo</snm>
                  <fnm>JJ</fnm>
               </au>
               <au>
                  <snm>Ju</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>John</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Enright</snm>
                  <fnm>AJ</fnm>
               </au>
               <au>
                  <snm>Marks</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Sander</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Tuschl</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2004</pubdate>
            <volume>304</volume>
            <fpage>734</fpage>
            <lpage>736</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.1096781</pubid>
                  <pubid idtype="pmpid" link="fulltext">15118162</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B17">
            <title>
               <p>miRBase: microRNA sequences, targets and gene nomenclature.</p>
            </title>
            <aug>
               <au>
                  <snm>Griffiths-Jones</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Grocock</snm>
                  <fnm>RJ</fnm>
               </au>
               <au>
                  <snm>van Dongen</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Bateman</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Enright</snm>
                  <fnm>AJ</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2006</pubdate>
            <volume>34</volume>
            <fpage>D140</fpage>
            <lpage>144</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1347474</pubid>
                  <pubid idtype="pmpid" link="fulltext">16381832</pubid>
                  <pubid idtype="doi">10.1093/nar/gkj112</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B18">
            <title>
               <p>The microRNA Registry.</p>
            </title>
            <aug>
               <au>
                  <snm>Griffiths-Jones</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2004</pubdate>
            <volume>32</volume>
            <fpage>D109</fpage>
            <lpage>111</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">308757</pubid>
                  <pubid idtype="pmpid" link="fulltext">14681370</pubid>
                  <pubid idtype="doi">10.1093/nar/gkh023</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B19">
            <title>
               <p>Processing of primary microRNAs by the Microprocessor complex.</p>
            </title>
            <aug>
               <au>
                  <snm>Denli</snm>
                  <fnm>AM</fnm>
               </au>
               <au>
                  <snm>Tops</snm>
                  <fnm>BB</fnm>
               </au>
               <au>
                  <snm>Plasterk</snm>
                  <fnm>RH</fnm>
               </au>
               <au>
                  <snm>Ketting</snm>
                  <fnm>RF</fnm>
               </au>
               <au>
                  <snm>Hannon</snm>
                  <fnm>GJ</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2004</pubdate>
            <volume>432</volume>
            <fpage>231</fpage>
            <lpage>235</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature03049</pubid>
                  <pubid idtype="pmpid" link="fulltext">15531879</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B20">
            <title>
               <p>The Microprocessor complex mediates the genesis of microRNAs.</p>
            </title>
            <aug>
               <au>
                  <snm>Gregory</snm>
                  <fnm>RI</fnm>
               </au>
               <au>
                  <snm>Yan</snm>
                  <fnm>KP</fnm>
               </au>
               <au>
                  <snm>Amuthan</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Chendrimada</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Doratotaj</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Cooch</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Shiekhattar</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2004</pubdate>
            <volume>432</volume>
            <fpage>235</fpage>
            <lpage>240</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature03120</pubid>
                  <pubid idtype="pmpid" link="fulltext">15531877</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B21">
            <title>
               <p>The Drosha-DGCR8 complex in primary microRNA processing.</p>
            </title>
            <aug>
               <au>
                  <snm>Han</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Lee</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Yeom</snm>
                  <fnm>KH</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>YK</fnm>
               </au>
               <au>
                  <snm>Jin</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>VN</fnm>
               </au>
            </aug>
            <source>Genes Dev</source>
            <pubdate>2004</pubdate>
            <volume>18</volume>
            <fpage>3016</fpage>
            <lpage>3027</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">535913</pubid>
                  <pubid idtype="pmpid" link="fulltext">15574589</pubid>
                  <pubid idtype="doi">10.1101/gad.1262504</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B22">
            <title>
               <p>The human DiGeorge syndrome critical region gene 8 and its <it>D. melanogaster </it>homolog are required for miRNA biogenesis.</p>
            </title>
            <aug>
               <au>
                  <snm>Landthaler</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Yalcin</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Tuschl</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Curr Biol</source>
            <pubdate>2004</pubdate>
            <volume>14</volume>
            <fpage>2162</fpag