<?xml version='1.0'?>
<!DOCTYPE art SYSTEM 'http://www.biomedcentral.com/xml/article.dtd'>
<art>
   <ui>gb-2009-10-4-r43</ui>
   <ji>GBJ</ji>
   <fm>
      <dochead>Research</dochead>
      <bibl>
         <title>
            <p>The bovine lactation genome: insights into the evolution of mammalian milk</p>
         </title>
         <aug>
            <au id="A1" ca="yes">
               <snm>Lemay</snm>
               <mi>G</mi>
               <fnm>Danielle</fnm>
               <insr iid="I1"/>
               <email>dglemay@ucdavis.edu</email>
            </au>
            <au id="A2">
               <snm>Lynn</snm>
               <mi>J</mi>
               <fnm>David</fnm>
               <insr iid="I2"/>
               <email>david_lynn@sfu.ca</email>
            </au>
            <au id="A3">
               <snm>Martin</snm>
               <mi>F</mi>
               <fnm>William</fnm>
               <insr iid="I1"/>
               <email>wfmartin@ucdavis.edu</email>
            </au>
            <au id="A4">
               <snm>Neville</snm>
               <mi>C</mi>
               <fnm>Margaret</fnm>
               <insr iid="I3"/>
               <email>Peggy.Neville@ucdenver.edu</email>
            </au>
            <au id="A5">
               <snm>Casey</snm>
               <mi>M</mi>
               <fnm>Theresa</fnm>
               <insr iid="I4"/>
               <email>ande1218@msu.edu</email>
            </au>
            <au id="A6">
               <snm>Rincon</snm>
               <fnm>Gonzalo</fnm>
               <insr iid="I5"/>
               <email>grincon@ucdavis.edu</email>
            </au>
            <au id="A7">
               <snm>Kriventseva</snm>
               <mi>V</mi>
               <fnm>Evgenia</fnm>
               <insr iid="I6"/>
               <email>evgenia.kriventseva@isb-sib.ch</email>
            </au>
            <au id="A8">
               <snm>Barris</snm>
               <mi>C</mi>
               <fnm>Wesley</fnm>
               <insr iid="I7"/>
               <email>wes.barris@csiro.au</email>
            </au>
            <au id="A9">
               <snm>Hinrichs</snm>
               <mi>S</mi>
               <fnm>Angie</fnm>
               <insr iid="I8"/>
               <email>angie@soe.ucsc.edu</email>
            </au>
            <au id="A10">
               <snm>Molenaar</snm>
               <mi>J</mi>
               <fnm>Adrian</fnm>
               <insr iid="I9"/>
               <email>adrian.molenaar@agresearch.co.nz</email>
            </au>
            <au id="A11">
               <snm>Pollard</snm>
               <mi>S</mi>
               <fnm>Katherine</fnm>
               <insr iid="I10"/>
               <email>kpollard@gladstone.ucsf.edu</email>
            </au>
            <au id="A12">
               <snm>Maqbool</snm>
               <mi>J</mi>
               <fnm>Nauman</fnm>
               <insr iid="I11"/>
               <email>nauman.maqbool@agresearch.co.nz</email>
            </au>
            <au id="A13">
               <snm>Singh</snm>
               <fnm>Kuljeet</fnm>
               <insr iid="I9"/>
               <email>kuljeet.singh@agresearch.co.nz</email>
            </au>
            <au id="A14">
               <snm>Murney</snm>
               <fnm>Regan</fnm>
               <insr iid="I9"/>
               <email>Regan.Murney@agresearch.co.nz</email>
            </au>
            <au id="A15">
               <snm>Zdobnov</snm>
               <mi>M</mi>
               <fnm>Evgeny</fnm>
               <insr iid="I12"/>
               <insr iid="I13"/>
               <insr iid="I14"/>
               <email>zdobnov@medecine.unige.ch</email>
            </au>
            <au id="A16">
               <snm>Tellam</snm>
               <mi>L</mi>
               <fnm>Ross</fnm>
               <insr iid="I7"/>
               <email>Ross.Tellam@csiro.au</email>
            </au>
            <au id="A17">
               <snm>Medrano</snm>
               <mi>F</mi>
               <fnm>Juan</fnm>
               <insr iid="I5"/>
               <email>jfmedrano@ucdavis.edu</email>
            </au>
            <au id="A18">
               <snm>German</snm>
               <fnm>J Bruce</fnm>
               <insr iid="I1"/>
               <insr iid="I15"/>
               <email>jbgerman@ucdavis.edu</email>
            </au>
            <au id="A19">
               <snm>Rijnkels</snm>
               <fnm>Monique</fnm>
               <insr iid="I16"/>
               <email>rijnkel@bcm.tmc.edu</email>
            </au>
         </aug>
         <insg>
            <ins id="I1">
               <p>Department of Food Science and Technology, University of California Davis, One Shields Avenue, Davis, CA 95616, USA</p>
            </ins>
            <ins id="I2">
               <p>Department of Molecular Biology and Biochemistry, Simon Fraser University, University Drive, Burnaby, BC, V5A 1S6, Canada</p>
            </ins>
            <ins id="I3">
               <p>Department of Physiology and Biophysics, University of Colorado Denver, Anschutz Medical Center, E. 19th Ave, Aurora CO 80045, USA</p>
            </ins>
            <ins id="I4">
               <p>Department of Animal Science, Michigan State University, East Lansing, MI 48824-1225, USA</p>
            </ins>
            <ins id="I5">
               <p>Department of Animal Science, University of California Davis, One Shields Avenue, Davis, CA 95616, USA</p>
            </ins>
            <ins id="I6">
               <p>Department of Structural Biology and Bioinformatics, University of Geneva Medical School, rue Michel-Servet, 1211 Geneva, Switzerland</p>
            </ins>
            <ins id="I7">
               <p>CSIRO Livestock Industries, Queensland Bioscience Precinct, Carmody Road, St Lucia, Queensland 4067, Australia</p>
            </ins>
            <ins id="I8">
               <p>Center for Biomolecular Science and Engineering, University of California Santa Cruz, High St, Santa Cruz, CA 95064, USA</p>
            </ins>
            <ins id="I9">
               <p>Dairy Science and Technology, AgResearch, Ruakura Research Centre, East Street, Hamilton, 3240, New Zealand</p>
            </ins>
            <ins id="I10">
               <p>Division of Biostatistics and Gladstone Institutes, University of California San Francisco, Owens St, San Francisco, CA 94158, USA</p>
            </ins>
            <ins id="I11">
               <p>Bioinformatics, Mathematics and Statistics, AgResearch, Invermay Agricultural Centre, Puddle Alley, Mosgiel 9053, New Zealand</p>
            </ins>
            <ins id="I12">
               <p>Department of Genetic Medicine and Development, University of Geneva Medical School, rue Michel-Servet, 1211 Geneva, Switzerland</p>
            </ins>
            <ins id="I13">
               <p>Swiss Institute of Bioinformatics, rue Michel-Servet, 1211 Geneva, Switzerland</p>
            </ins>
            <ins id="I14">
               <p>Imperial College London, South Kensington Campus, London, SW7 2AZ, UK</p>
            </ins>
            <ins id="I15">
               <p>Nestl&#233; Research Centre, Vers-chez-les-Blanc CH-1000, Lausanne 26, Switzerland</p>
            </ins>
            <ins id="I16">
               <p>Department of Pediatrics, Children's Nutrition Research Center, Baylor College of Medicine, Bates Street, Houston TX 77030, USA</p>
            </ins>
         </insg>
         <source>Genome Biology</source>
         <issn>1465-6906</issn>
         <pubdate>2009</pubdate>
         <volume>10</volume>
         <issue>4</issue>
         <fpage>R43</fpage>
         <url>http://genomebiology.com/2009/10/4/R43</url>
         <xrefbib>
            <pubidlist>
               <pubid idtype="pmpid">19393040</pubid>
               <pubid idtype="doi">10.1186/gb-2009-10-4-r43</pubid>
            </pubidlist>
         </xrefbib>
      </bibl>
      <history>
         <rec>
            <date>
               <day>12</day>
               <month>9</month>
               <year>2008</year>
            </date>
         </rec>
         <revrec>
            <date>
               <day>17</day>
               <month>12</month>
               <year>2008</year>
            </date>
         </revrec>
         <acc>
            <date>
               <day>24</day>
               <month>4</month>
               <year>2009</year>
            </date>
         </acc>
         <pub>
            <date>
               <day>24</day>
               <month>4</month>
               <year>2009</year>
            </date>
         </pub>
      </history>
      <cpyrt>
         <year>2009</year>
         <collab>Lemay et al.; licensee BioMed Central Ltd.</collab>
         <note>This is an open access article distributed under the terms of the Creative Commons Attribution License (<url>http://creativecommons.org/licenses/by/2.0</url>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</note>
      </cpyrt>
      <shorttitle>
         <p>Evolution of lactation</p>
      </shorttitle>
      <shortabs>
         <p>Comparison of milk protein and mammary genes in the bovine genome with those from other mammals gives insights into the evolution of lactation.</p>
      </shortabs>
      <abs>
         <sec>
            <st>
               <p>Abstract</p>
            </st>
            <sec>
               <st>
                  <p>Background</p>
               </st>
               <p>The newly assembled <it>Bos taurus </it>genome sequence enables the linkage of bovine milk and lactation data with other mammalian genomes.</p>
            </sec>
            <sec>
               <st>
                  <p>Results</p>
               </st>
               <p>Using publicly available milk proteome data and mammary expressed sequence tags, 197 milk protein genes and over 6,000 mammary genes were identified in the bovine genome. Intersection of these genes with 238 milk production quantitative trait loci curated from the literature decreased the search space for milk trait effectors by more than an order of magnitude. Genome location analysis revealed a tendency for milk protein genes to be clustered with other mammary genes. Using the genomes of a monotreme (platypus), a marsupial (opossum), and five placental mammals (bovine, human, dog, mouse, rat), gene loss and duplication, phylogeny, sequence conservation, and evolution were examined. Compared with other genes in the bovine genome, milk and mammary genes are: more likely to be present in all mammals; more likely to be duplicated in therians; more highly conserved across Mammalia; and evolving more slowly along the bovine lineage. The most divergent proteins in milk were associated with nutritional and immunological components of milk, whereas highly conserved proteins were associated with secretory processes.</p>
            </sec>
            <sec>
               <st>
                  <p>Conclusions</p>
               </st>
               <p>Although both copy number and sequence variation contribute to the diversity of milk protein composition across species, our results suggest that this diversity is primarily due to other mechanisms. Our findings support the essentiality of milk to the survival of mammalian neonates and the establishment of milk secretory mechanisms more than 160 million years ago.</p>
            </sec>
         </sec>
      </abs>
   </fm>
   <meta>
      <classifications>
         <classification type="BMC" subtype="cross_series_title" id="bovine">Bovine: the companion papers for the publication of the bovine genome sequence</classification>
         <classification type="BMC" subtype="cross_series_editor" id="bovine"/>
         <classification type="BMC" subtype="man_spc_id" id="30010005">Development</classification>
         <classification type="BMC" subtype="man_spc_id" id="30010008">Evolution</classification>
         <classification type="BMC" subtype="man_spc_id" id="30010018">Physiology</classification>
      </classifications>
   </meta>
   <bdy>
      <sec>
         <st>
            <p>Background</p>
         </st>
         <p>With the arrival of the <it>Bos taurus </it>genome assembly, bovine milk and lactation data can be linked to other mammalian genomes for the first time, allowing us to gain additional insight into the molecular evolution of milk and lactation. Mammals are warm-blooded vertebrate animals that nourish their young with milk produced by mammary glands. They first appeared approximately 166 million years ago, but their evolution can be traced back 310 million years when synapsids first branched from amniotes <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>. Two subclasses of mammals evolved, the prototherians and therians. Prototheria are monotremes, mammals that lay eggs; extant species include the platypus and echidnas. Theria are mammals that bear live young; they are divided into the infraclasses Metatheria or marsupials - which include kangaroos and opossums - and the more common Eutheria or placental mammals - which include, for example, humans, dogs, mice, rats, and bovine species. Figure <figr fid="F1">1</figr> shows the mammalian phylogenetic tree with approximate divergence times <abbrgrp><abbr bid="B2">2</abbr><abbr bid="B3">3</abbr></abbrgrp>. Of the mammalian species listed, high coverage genomic data are available for the platypus (<it>Ornithorhynchus anatinus</it>), a prototherian, the opossum (<it>Monodelphis domestica</it>), a metatherian, and a number of placental mammals, including human (<it>Homo sapiens</it>), rat (<it>Rattus norvegicus</it>), mouse (<it>Mus musculus</it>), dog (<it>Canis familiaris</it>), and now bovine (<it>Bos taurus</it>).</p>
         <fig id="F1">
            <title>
               <p>Figure 1</p>
            </title>
            <caption>
               <p>Simplified phylogenetic tree illustrates relationships of representative extant Mammalian species</p>
            </caption>
            <text>
               <p>Simplified phylogenetic tree illustrates relationships of representative extant Mammalian species. Estimates in millions of years ago (MYA) of origin of each major branch were derived from Bininda-Emonds <it>et al</it>. <abbrgrp><abbr bid="B2">2</abbr></abbrgrp>. The two earliest splits established monotremes (166.2 MYA), and marsupials and placentals (147.7 MYA). Approximately 50 million years pass before the origination of any extant groups, and then the four placental superorders (italicized capitals) arose within 2.4 million years of each other.</p>
            </text>
            <graphic file="gb-2009-10-4-r43-1"/>
         </fig>
         <p>The reproductive strategy, developmental requirements of the young, and environment of the maternal-infant pair are thought to drive variation in milk composition among species. Platypus and opossum neonates are embryonic in appearance and dependent on milk for growth and immunological protection during the equivalent of the fetal period in placental mammals <abbrgrp><abbr bid="B4">4</abbr><abbr bid="B5">5</abbr></abbrgrp>. In contrast, placental mammals have relatively longer gestation and shorter lactation periods. These reproductive strategies directly impact milk composition as the immature monotreme and marsupial young have different needs with regard to growth, development, and adaptive immunity. Other aspects of the reproductive strategy, such as the length of the lactation period and the maternal nutritional strategy, can also impact milk composition. For example, mammals that fast or feed little during lactation produce milks low in sugar but high in fat to minimize energy and water demands while sustaining nutrient transfer to the young <abbrgrp><abbr bid="B6">6</abbr></abbrgrp>. The data in Table <tblr tid="T1">1</tblr> illustrate that even the gross macronutrient composition of milk can be highly variable among species.</p>
         <tbl id="T1">
            <title>
               <p>Table 1</p>
            </title>
            <caption>
               <p>Gross macronutrient composition of mammalian milk</p>
            </caption>
            <tblbdy cols="4">
               <r>
                  <c ca="left">
                     <p>Species</p>
                  </c>
                  <c ca="center">
                     <p>Fat %</p>
                  </c>
                  <c ca="center">
                     <p>Crude protein %</p>
                  </c>
                  <c ca="center">
                     <p>Lactose and sugar %</p>
                  </c>
               </r>
               <r>
                  <c cspan="4">
                     <hr/>
                  </c>
               </r>
               <r>
                  <c ca="left">
                     <p>Bovine <abbrgrp><abbr bid="B76">76</abbr></abbrgrp></p>
                  </c>
                  <c ca="center">
                     <p>3.7 (3.5-5.5)</p>
                  </c>
                  <c ca="center">
                     <p>3.4</p>
                  </c>
                  <c ca="center">
                     <p>4.6</p>
                  </c>
               </r>
               <r>
                  <c ca="left">
                     <p>Dog <abbrgrp><abbr bid="B77">77</abbr></abbrgrp></p>
                  </c>
                  <c ca="center">
                     <p>9.5</p>
                  </c>
                  <c ca="center">
                     <p>7.5</p>
                  </c>
                  <c ca="center">
                     <p>3.8</p>
                  </c>
               </r>
               <r>
                  <c ca="left">
                     <p>Human <abbrgrp><abbr bid="B76">76</abbr></abbrgrp></p>
                  </c>
                  <c ca="center">
                     <p>4</p>
                  </c>
                  <c ca="center">
                     <p>1</p>
                  </c>
                  <c ca="center">
                     <p>7</p>
                  </c>
               </r>
               <r>
                  <c ca="left">
                     <p>Mouse <abbrgrp><abbr bid="B77">77</abbr></abbrgrp></p>
                  </c>
                  <c ca="center">
                     <p>27</p>
                  </c>
                  <c ca="center">
                     <p>12.5</p>
                  </c>
                  <c ca="center">
                     <p>2.6</p>
                  </c>
               </r>
               <r>
                  <c ca="left">
                     <p>Rat <abbrgrp><abbr bid="B77">77</abbr></abbrgrp></p>
                  </c>
                  <c ca="center">
                     <p>8.8</p>
                  </c>
                  <c ca="center">
                     <p>8.1</p>
                  </c>
                  <c ca="center">
                     <p>3.8</p>
                  </c>
               </r>
               <r>
                  <c ca="left">
                     <p>Opossum <abbrgrp><abbr bid="B78">78</abbr></abbrgrp></p>
                  </c>
                  <c ca="center">
                     <p>7.4</p>
                  </c>
                  <c ca="center">
                     <p>10</p>
                  </c>
                  <c ca="center">
                     <p>10 (oligosaccharides)</p>
                  </c>
               </r>
               <r>
                  <c ca="left">
                     <p>Platypus <abbrgrp><abbr bid="B77">77</abbr></abbrgrp></p>
                  </c>
                  <c ca="center">
                     <p>22.2</p>
                  </c>
                  <c ca="center">
                     <p>8.2</p>
                  </c>
                  <c ca="center">
                     <p>3.7 (difucosyllactose)</p>
                  </c>
               </r>
            </tblbdy>
         </tbl>
         <p>Because bovine milk is a major human food and agro-economical product, comparison of bovine milk with the milk of other species in the context of the bovine genome sequence is important not only to improve our understanding of mammary evolution but also of bovine milk production and human nutrition. The importance of bovine milk consumption to humans is underscored by the domestication of cattle and the convergent evolution of lactase persistency in diverse human populations <abbrgrp><abbr bid="B7">7</abbr></abbrgrp>. The availability of the bovine genome sequence provides unique opportunities to investigate milk and lactation. Lactation has been studied more extensively in <it>Bos taurus </it>than in other species, resulting in extensive milk proteome data, milk production quantitative trait loci (QTL), and over 100,000 mammary-related bovine expressed sequence tags (ESTs).</p>
         <p>In the present study, we identified the bovine lactation genome <it>in silico </it>and examined its content and organization. Utilizing the genomes of the seven mammals listed above and in Table <tblr tid="T1">1</tblr>, we investigated gene loss and duplication, phylogeny, sequence conservation, and evolution of milk and mammary genes. Given the conspicuous absence of some known abundant proteins, such as beta-lactoglobulin and whey acidic protein, in the milk of some species <abbrgrp><abbr bid="B8">8</abbr></abbrgrp>, we hypothesized that variation in milk composition resides in part in variation in the milk protein genome. We show that gene duplication and genomic rearrangement contribute to changes in the milk protein gene complement of <it>Bos taurus </it>and other species. Although the casein proteins are highly divergent across mammalian milks <abbrgrp><abbr bid="B9">9</abbr><abbr bid="B10">10</abbr></abbrgrp>, we report that milk and mammary genes are more highly conserved, on average, than other genes in the bovine genome. Our findings illustrate the importance of lactation for the survival of mammalian species and suggest that we must look more deeply, perhaps into the non-coding regions of the genome that regulate milk protein gene expression, to understand the species-specificity of milk composition. Among mammals, we find milk proteins that are most divergent have nutritional and immunological functions, whereas the least divergent milk protein genes have functions that are important for the formation and secretion of mammalian milk. High conservation of milk fat globule membrane protein genes among the mammalian genomes suggests that the secretory process for milk production was firmly established more than 160 million years ago.</p>
      </sec>
      <sec>
         <st>
            <p>Results and discussion</p>
         </st>
         <sec>
            <st>
               <p>Milk and mammary gene sets</p>
            </st>
            <p>Two proteome studies of bovine milk <abbrgrp><abbr bid="B11">11</abbr><abbr bid="B12">12</abbr></abbrgrp> were used to derive a milk protein gene set of 197 unique genes (see 'Collection of the milk protein set' in Materials and methods). Using 94,136 bovine mammary ESTs, mammary gene sets were created to represent the following developmental stages or conditions: virgin, 3,889 genes; pregnancy, 1,383 genes; lactation, 3,111 genes; involution, 867 genes; and mastitis, 840 genes (see 'Collection of the mammary gene sets' in Materials and methods). In total, 6,469 genes are constituents of one or more of these mammary gene sets, suggesting that one-quarter of all predicted genes are expressed in the mammary gland at some point during the lactation cycle. Genes from the milk protein and mammary gene sets are present on all 29 bovine autosomes and on the X chromosome (Figure <figr fid="F2">2</figr>).</p>
            <fig id="F2">
               <title>
                  <p>Figure 2</p>
               </title>
               <caption>
                  <p>Distribution of milk and mammary genes across all bovine chromosomes</p>
               </caption>
               <text>
                  <p>Distribution of milk and mammary genes across all bovine chromosomes. In this chromosome map, each of the 30 bovine chromosomes is illustrated by a pair of columns, with genomic locations of milk and mammary genes in the first column, and milk-trait QTL in the second column. Note that the milk and mammary genes are distributed across all chromosomes.</p>
               </text>
               <graphic file="gb-2009-10-4-r43-2"/>
            </fig>
            <p>The milk protein gene set is the most extensive curation to date of genes that give rise to milk proteins, the functions of which have not yet been comprehensively studied. To gain insight into the possible molecular functions of milk proteins, the milk protein gene set was analyzed for enriched molecular function Gene Ontology (GO) terms (see Materials and methods). Four significant, minimally redundant molecular function GO terms were identified: 'GTPase activity,' 'GTP binding,' 'pattern recognition receptor activity,' and 'calcium ion binding.' More than 30 milk proteins that were previously isolated in the milk fat globule membrane <abbrgrp><abbr bid="B11">11</abbr><abbr bid="B12">12</abbr></abbrgrp> were associated with 'GTPase activity' or 'GTP binding'. GTPases are known to be involved in numerous secretory processes, and for this reason, it seems likely that these proteins have a role in assembly and secretion of the milk fat globule and possibly other milk components. The 'pattern recognition receptor activity' GO term was enriched due to the presence in milk of the cell surface and immune recognition components CD14 [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_174008">NM_174008</ext-link>], TLR2 [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_174197">NM_174197</ext-link>], TLR4 [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_174198">NM_174198</ext-link>], and DMBT1 [GenBank:<ext-link ext-link-type="gen" ext-link-id="S78981">S78981</ext-link>]. These proteins are involved in the activation of the innate immune system when they associate with cells. Further, the soluble forms of CD14 and TLR2, which can act as decoy receptors for microbial pathogens, could potentially modulate local inflammation following bacterial colonization in the neonate gut <abbrgrp><abbr bid="B13">13</abbr><abbr bid="B14">14</abbr></abbrgrp>. 
Enrichment of the GO term 'calcium ion binding' was expected as many milk proteins are known to bind calcium, a mineral required in abundance by the growing neonate.</p>
            <p>Milk is traditionally thought of as a food that provides the neonate with nutrients and some immune protection, such as that provided by immunoglobulins. Prior research also suggests that various milk proteins are resistant to digestion by gastric proteases at physiological pH <abbrgrp><abbr bid="B15">15</abbr></abbrgrp> and that intact or partially intact milk proteins may either express their functions in the neonatal intestinal tract or may be absorbed and act on other organs <abbrgrp><abbr bid="B16">16</abbr></abbrgrp>. To understand what signaling might be possible if milk proteins remain partially or wholly undigested, the milk protein gene set was interrogated for enriched pathway annotations (see 'Pathway analysis' in Materials and methods). The milk protein gene set contains elements of two marginally significant pathways that lead to activation of PPARalpha and LXR, two nuclear receptors involved in sensing nutrients and modifying metabolic responses at the level of gene transcription. Milk proteins that are associated with the LXR/RXR activation pathway include the cell surface or secreted molecules CD14 [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_174008">NM_174008</ext-link>], CD36 [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_174010">NM_174010</ext-link>], TLR4 [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_174198">NM_174198</ext-link>], and MSR1 [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_001113240">NM_001113240</ext-link>], the apolipoproteins APOA1 [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_174242">NM_174242</ext-link>] and APOE [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_173991">NM_173991</ext-link>] and the lipid synthesis enzymes ACACA [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_174224">NM_174224</ext-link>] and FASN [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_001012669">NM_001012669</ext-link>].
Those associated with the PPARalpha/RXRalpha activation pathway include the cell surface molecule CD36 [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_174010">NM_174010</ext-link>], the endoplasmic reticulum protein disulphide isomerase PDIA3 [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_174333">NM_174333</ext-link>], the apolipoprotein APOA1 [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_174242">NM_174242</ext-link>], the transcription factor STAT5B [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_174617">NM_174617</ext-link>], the heat shock protein HSP90AA1 [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_001012670">NM_001012670</ext-link>], the regulator of adenylate cyclase GNAS [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_181021">NM_181021</ext-link>], and two enzymes involved in lipid synthesis, GPD2 [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_001100296">NM_001100296</ext-link>] and FASN [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_001012669">NM_001012669</ext-link>]. It is likely that the products of these genes, which are well known to be active at metabolic control points in many organs, are active in the mammary gland and then enter the milk via cytoplasmic crescents in the milk fat globules. Keenan and Patton <abbrgrp><abbr bid="B17">17</abbr></abbrgrp> noted that cytoplasmic sampling, as part of milk fat globule formation, is present in all species examined to date, including humans, and that such evolutionary persistence suggests possible benefits for mother or offspring. Further research will be needed to determine whether these proteins are present in milk at sufficient quantities to have a physiological effect in the neonate.</p>
            <p>All mammary gene sets were interrogated for enrichment of GO terms or pathway annotations, but the results did not further our knowledge of mammary biology. Consistent with our previous study <abbrgrp><abbr bid="B18">18</abbr></abbrgrp>, current GO term annotations were incomplete or generally out of context when applied to the mammary gland. Although bovine EST data indicate that more than 3,000 genes are expressed in the lactating mammary gland, a mere 22 genes are currently annotated with the GO term 'lactation.'</p>
         </sec>
         <sec>
            <st>
               <p>Bovine milk production QTL</p>
            </st>
            <p>Milk trait QTL delineate gene regions that harbor genes or <it>cis</it>-acting elements that are responsible for the milk trait phenotype. The dairy industry has invested enormous resources into the identification of these QTL for milk production traits in bovine, particularly milk yield, protein yield, fat yield, protein percentage, and fat percentage. Reviewing the literature, 238 milk trait QTL were identified for these five traits in 59 references (Additional data files 8-9). Of the 238 QTL, 63 were reported with flanking markers having a median interval size of approximately 17 million base pairs. Following a previously established method <abbrgrp><abbr bid="B19">19</abbr></abbrgrp>, the 175 remaining QTL that were reported with only a single peak marker were assigned this median interval size. Some QTL were reported for more than one milk trait; thus, these QTL span only 168 unique genome locations. These milk trait QTL span all 29 autosomes (Figure <figr fid="F2">2</figr>), with the highest densities of QTL occurring on chromosomes 27, 6, 20, and 14 (Additional data file 10). Possible differences in genetic architecture are most obvious between fat and protein percentage traits, where fat percentage QTL are present on fewer chromosomes with lower QTL density and protein percentage QTL are present on all but two chromosomes, most with higher QTL density (Additional data file 10). Fat percentage may be controlled by relatively fewer genes each with larger effects, whereas protein percentage may be controlled by far more genes each with smaller effects.</p>
            <p>The milk trait QTL provide a very coarse map of genomic areas of interest that cover nearly half of the bovine assembly. Milk yield QTL overlap with 19.5% of the genomic assembly, fat yield QTL with 15.4%, protein yield QTL with 21.1%, fat percentage QTL with 12.3%, and protein percentage QTL with 33.6% of the genome assembly. The densities of genes within these QTL are very similar for each milk trait, with between 9.1 and 10.1 genes per million base pairs. Meanwhile, there are 8.4 genes per million base pairs in regions that do not overlap with any milk trait QTL. Given the gene density and number of QTL associated with each trait, each individual QTL is expected to contain between 105 and 127 genes.</p>
            <p>To identify candidate genes within milk trait QTL, the lactation mammary gene set was intersected with the milk trait QTL. Between 12.5% and 13.7% of the genes within milk trait QTL are expressed during lactation. In other words, within a single milk trait QTL, between 13.9 and 17.1 genes are expected to be expressed during lactation. Thus, although the set of milk trait QTL reduces the search space for milk trait effectors by less than one order of magnitude, the use of expression data can contribute considerably towards the identification of candidate genes. Genes within milk trait QTL that are expressed in the mammary gland during lactation are listed in Additional data files 11-16. Milk trait effectors are likely to be near these candidate genes.</p>
         </sec>
         <sec>
            <st>
               <p>Genome organization of milk and mammary genes</p>
            </st>
            <p>Studies of eukaryotic genomes have demonstrated that genes with coordinated expression or shared ancestry appear in clusters across the genome <abbrgrp><abbr bid="B20">20</abbr></abbrgrp>. Given that the clustering of the casein milk protein genes is essential to their coordinated transcription in the lactating mammary gland <abbrgrp><abbr bid="B9">9</abbr><abbr bid="B10">10</abbr></abbrgrp>, the arrival of the bovine genome sequence provides the opportunity to discover other gene clusters relevant to milk, lactation, or mammary biology. A genome-wide search was conducted for genomic intervals of 500 kb and greater that are statistically enriched with genes from the milk protein and mammary gene sets (see 'Genomic localization analysis' in Materials and methods). Among these gene sets, 190 non-overlapping statistically significant clusters were identified: four unique clusters in the milk protein gene set and 54, 60, 30, and 19 unique clusters in the pregnancy, lactation, involution, and mastitis mammary gene sets, respectively. Spreadsheets of all significant gene clusters are available in Additional data files 17 and 18.</p>
            <p>The four significant milk protein gene clusters comprised the immunoglobulin genes, casein genes, fibrinogen genes, and genes that encode milk fat globule proteins. Because it is known that immunoglobulins, casein genes, and fibrinogen genes are each clustered in mammalian genomes <abbrgrp><abbr bid="B9">9</abbr><abbr bid="B10">10</abbr><abbr bid="B21">21</abbr><abbr bid="B22">22</abbr></abbrgrp>, this is a good verification of methodology. The cluster of genes that encode milk fat globule proteins contains FASN [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_001012669">NM_001012669</ext-link>], ARHGDIA [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_176650">NM_176650</ext-link>], and P4HB [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_174135">NM_174135</ext-link>]. However, P4HB has only been isolated in mastitic milk <abbrgrp><abbr bid="B11">11</abbr></abbrgrp>. By manual inspection, we found that these genes also cluster in the human, mouse, and other mammalian genomes. Based on EST data, other genes in this genomic region are expressed at various times in the mammary gland. Aside from these four clusters, there does not appear to be a preponderance of putative regulatory modules among genes in the milk protein gene set. Whereas only 6.6% of the milk protein genes were within a milk protein-specific cluster, 27.9% were within one of the mammary gene set clusters. Therefore, it is likely that milk protein genes are regulated along with other mammary genes independent of the function or cellular localization of the proteins they encode.</p>
            <p>Next, we examined whether genes were clustered according to developmental stage, but found there were no gross differences in gene clustering using this parameter. Between 24% and 30% of the genes from each mammary gene set - virgin, pregnancy, lactation, and involution - were within one of the other mammary set clusters. Likewise, 28% of the genes from the mastitis mammary gene set fell within a mammary cluster. Thus, mammary genes are not differentially clustered by developmental stage or condition.</p>
            <p>Genes may be clustered due to shared evolution, as duplicated genes are often co-localized in the genome. In our study, a significant cluster required a minimum of three genes that were not paralogs. When the paralog requirement was removed, only seven additional unique clusters of triplets or greater were identified. Significant clusters with more than one paralog appear to be confined to the major histocompatibility complex region on bovine chromosome 23. These data suggest that recent duplication is not a common driver of clustered mammary genes in the bovine genome.</p>
            <p>In summary, the milk protein genes generally do not form clusters with each other but do appear to form clusters with other mammary genes. Milk protein genes may be regulated along with other lactation genes without regard to the final destination of the gene product. As mammary genes are generally clustered neither by developmental stage nor due to recent duplication, it appears that the need for co-expression in the mammary gland is the denominator for co-localization rather than co-functionality or shared ancestry. This organization in clusters of co-expressed mammary genes might be constrained by unidentified distal <it>cis</it>-acting elements <abbrgrp><abbr bid="B20">20</abbr></abbrgrp>, chromatin conformation <abbrgrp><abbr bid="B23">23</abbr></abbrgrp>, or coordinately expressed micro-RNAs <abbrgrp><abbr bid="B24">24</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Milk and mammary gene copy number trends in mammals</p>
            </st>
            <p>Gene copy number contributes to genetic diversity both between and within species. Here, copy numbers of bovine milk protein genes were determined in the bovine, human, mouse, rat, dog, opossum, and platypus genomes using orthologs generated for all bovine consensus gene models (see 'Orthology delineation' in Materials and methods). Genes from the milk protein gene set that were uniquely duplicated in <it>B. taurus </it>and those that were missing copies in one or more of the placental mammals were manually curated (see 'Curation of milk protein orthologs' in Materials and methods). K-means clustering of these curated milk protein gene orthologs followed by seriation within each cluster yielded the heatmap shown in Figure <figr fid="F3">3</figr>. Three major trends were identified: single copy of the gene across Mammalia; gene not found in platypus; and duplication after platypus.</p>
            <fig id="F3">
               <title>
                  <p>Figure 3</p>
               </title>
               <caption>
                  <p>Heatmap of milk protein gene copy numbers across mammals</p>
               </caption>
               <text>
                  <p>Heatmap of milk protein gene copy numbers across mammals. Milk protein genes were clustered by copy number using the K-means algorithm followed by seriation within each cluster. Major trends, which convey the consensus profile of the cluster, are delineated by brackets. Most milk protein genes are either present as a single copy in each mammalian genome or as a single copy in all therian genomes. Duplicated genes are expanded after platypus in either a general or a species- or clade-specific manner. Black squares indicate that the gene was not found in a particular species, yellow-green squares indicate a single copy of the gene, and red squares indicate two or more copies of the gene. Brighter red squares indicate higher copy numbers.</p>
               </text>
               <graphic file="gb-2009-10-4-r43-3"/>
            </fig>
            <p>The absence of a milk or mammary gene in platypus or duplication after platypus (Figure <figr fid="F3">3</figr>) may be due to the expansion of gene families in the common therian ancestor. However, some of these genes may not be truly missing in the platypus genome, but may be undetectable by our methods due to incomplete or incorrect assembly of the platypus genome, lower sequence identity, or the inherent bias created by defining milk and mammary genes in the bovine genome. The identification of platypus orthologs of other genes in the bovine genome would also be affected by these biases; therefore, we next compared milk and mammary gene copy number trends to those genome-wide.</p>
            <p>For each major trend shown in Figure <figr fid="F3">3</figr>, rates of occurrence among the uncurated orthologs of the milk protein and lactation mammary gene sets were compared with the orthologs of all bovine consensus gene models using a hypergeometric distribution to determine statistical significance. More bovine milk protein orthologs were found in all six studied mammalian genomes than would be expected given the rate at which other bovine orthologs were found in these genomes (<it>P </it>&lt; 0.0001). Genes expressed during bovine lactation were also more likely than other genes to have orthologs in all of the mammalian genomes (<it>P </it>&lt; 0.0001). In other words, milk and mammary genes are more likely than other genes to be found in all mammals. This result might be explained in part by an increased power to detect more conserved genes (see 'Conservation of milk and mammary genes in mammals' below). There were also statistically fewer lactation genes missing in the platypus (<it>P </it>&lt; 0.005) and opossum genomes (<it>P </it>&lt; 2.2 &#215; 10<sup>-20</sup>); however, the number of milk protein genes missing in these genomes did not differ from the genome-wide rate. Finally, more milk protein and lactation genes were duplicated after platypus compared with the whole genome (<it>P </it>&lt; 0.001 and <it>P </it>&lt; 0.03, respectively). Together, these data support the essentiality of milk and mammary genes in Mammalia as well as suggest the possibility for expanded functionality in marsupials and placental mammals.</p>
            <p>Milk protein gene copy number variation may potentially contribute to the diversity of milk composition. Ortholog analysis indicated that the gene for beta-lactoglobulin (LGB), one of the most abundant proteins in milk, is duplicated in the dog and bovine genomes (Figure <figr fid="F3">3</figr>). In the bovine genome, this gene is located at the position of a previously predicted pseudogene <abbrgrp><abbr bid="B25">25</abbr></abbrgrp>. It has similarity to LGB-II genes in the horse and cat <abbrgrp><abbr bid="B26">26</abbr><abbr bid="B27">27</abbr><abbr bid="B28">28</abbr><abbr bid="B29">29</abbr></abbrgrp>. The similarity of this second gene to LGB-II in the horse, cat, and dog suggests that the LGB duplication existed in the common ancestor of the laurasiatherians (Figure <figr fid="F1">1</figr>). Using two different primer pairs, we were unable to identify the LGB-II transcript in bovine mammary tissue samples using RT-PCR (see Additional data file 22 for details). It is likely that the duplicated LGB gene is not expressed in the bovine mammary gland and that the presence of this duplication does not influence the concentration of LGB in bovine milk.</p>
            <p>LGB is apparently not present in human or mouse milk <abbrgrp><abbr bid="B30">30</abbr></abbrgrp>, although LGB-like proteins have been isolated from the milk of other primates <abbrgrp><abbr bid="B31">31</abbr><abbr bid="B32">32</abbr><abbr bid="B33">33</abbr></abbrgrp>. A human protein, progestagen-associated endometrial protein (PAEP), has significant homology to the bovine and equine LGB-II-like genes <abbrgrp><abbr bid="B29">29</abbr><abbr bid="B34">34</abbr><abbr bid="B35">35</abbr><abbr bid="B36">36</abbr></abbrgrp>. Although PAEP expression has been detected in the epithelial cells of human breast tissue <abbrgrp><abbr bid="B37">37</abbr></abbrgrp>, neither its presence nor that of an apparent LGB-like pseudogene [GenBank:<ext-link ext-link-type="gen" ext-link-id="AH011480">AH011480</ext-link>] that flanks the PAEP gene [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_001018049">NM_001018049</ext-link>] has been verified in human milk. We found that the LGB-like and PAEP genes are flanked by GLT6D1 [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_182974">NM_182974</ext-link>] and OBP2A [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_014582">NM_014582</ext-link>] in both the human and bovine genomes. This observation, combined with the fact that the baboon has both a PAEP gene <abbrgrp><abbr bid="B38">38</abbr></abbrgrp> and a LGB gene <abbrgrp><abbr bid="B33">33</abbr></abbrgrp>, suggests that the primate genes arose by duplication of an ancestral gene before the Laurasiatheria and Euarchontoglires diverged. We were unable to find this region in the rodent or rabbit genomes, and an evolutionary break point is present in mouse and rat in this region <abbrgrp><abbr bid="B39">39</abbr></abbrgrp>, suggesting that these genes may have been lost after the split between primates and glires. Although the presence of LGB in laurasiatherian milk and its absence in rodent milks have an obvious genetic basis, we cannot yet explain the absence of LGB in human milk.</p>
            <p>Some immune components of milk are uniquely duplicated in certain species or clades. For example, SAA3 [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_181016">NM_181016</ext-link>], which is duplicated in the bovine and dog genomes (Figure <figr fid="F3">3</figr>), is thought to be involved in mucin induction in the gut <abbrgrp><abbr bid="B40">40</abbr><abbr bid="B41">41</abbr></abbrgrp> and a human analog, SAA1, functions as an opsonin for Gram-negative bacteria <abbrgrp><abbr bid="B42">42</abbr></abbrgrp>. The Cathelicidin gene family is greatly expanded in the bovine, opossum, and platypus genomes, with 10, 8, and 12 copies, respectively <abbrgrp><abbr bid="B43">43</abbr><abbr bid="B44">44</abbr><abbr bid="B45">45</abbr></abbrgrp>, but some of the opossum and platypus orthologs were not found in our automated analysis due to their high heterogeneity. Expansions in this gene family may reflect increased exposure to bacteria at epithelial surfaces in these species. Our results show that the CD36 gene [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_174010">NM_174010</ext-link>], which encodes a scavenger receptor, has duplications in the <it>B. taurus </it>and rat genomes. Beta-2-microglobulin [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_173893">NM_173893</ext-link>] has a second copy in the bovine genome and may also have a duplicate in the platypus genome. This gene encodes one of two chains in the IgG transporter FcRn, which transfers IgG molecules across epithelial cells <abbrgrp><abbr bid="B46">46</abbr></abbrgrp>. Other variations in milk protein gene copy number (Figure <figr fid="F3">3</figr>) potentially give rise to diversity in milk protein composition.</p>
            <p>Milk protein gene loss does not appear to be a common occurrence. Of the bovine milk protein genes with an ortholog identified in the platypus genome (Figure <figr fid="F3">3</figr>), all but ten genes were found in all of the other studied mammalian genomes. However, because the bovine milk proteome is used as the reference, the loss of some milk protein genes in placental mammals relative to the monotreme and marsupial mammals may have been missed in our analysis. For example, whey acidic protein has been identified in the milk of many mammals such as mouse, rat, opossum, and platypus, but it is absent in bovine milk due to a frameshift mutation in the whey acidic protein gene <abbrgrp><abbr bid="B47">47</abbr></abbrgrp>. A full proteomic analysis of the milk samples from extant monotremes and marsupials will be needed to identify gene loss in placental mammals.</p>
            <p>Our analysis of milk protein gene copy numbers has several other limitations. First, the mammalian orthologs of bovine consensus gene models derived on a genome-wide basis (see 'Orthology delineation' in Materials and methods) may be inaccurate for genes in which the bovine gene model is incorrect or may be incomplete when orthologs are too divergent to be detected by this method. Although we attempted to overcome these limitations by manually curating milk protein gene orthologs, the analysis is only as good as the available genome sequences, and some duplications and deletions may have been missed due to errors and gaps in the genome assemblies. Directed sequencing will be needed to confirm specific results. However, we can generally conclude that there is considerable copy number variation of milk protein genes that may contribute to the taxonomic diversity of milk composition.</p>
         </sec>
         <sec>
            <st>
               <p>Taxonomic relationships of the milk protein genes</p>
            </st>
            <p>To understand the relationships of the milk proteins between mammalian taxa, a consensus tree of those milk proteins with single copy orthologs in the human, mouse, rat, dog, bovine, opossum, and platypus genomes was constructed using a super-alignment of the concatenated sequences (see 'Consensus tree construction' in Materials and methods). An unrooted radial tree depicting the relationships of the milk protein sequences (Figure <figr fid="F4">4</figr>) differs from the accepted phylogeny (Figure <figr fid="F1">1</figr>). Rodent milk proteins are more divergent from human milk proteins than are dog and bovine milk proteins despite the fact that the rodent and human common ancestor is more recent. To further test the relationships of human milk proteins with those of other taxa, pairwise percent identity (PID) was calculated between the human protein and its putative ortholog for the set of single copy orthologs present in all seven taxa. Average pairwise PIDs for the milk protein gene set confirm that human milk proteins are closest to dog, followed by bovine, then the rodents, then opossum and platypus (Figure <figr fid="F5">5</figr>). This observation is not unique to milk proteins as it is also true on a genome-wide basis <abbrgrp><abbr bid="B43">43</abbr></abbrgrp>. It has been proposed that rodent proteins are more divergent from human than are bovine proteins because rodents have a faster reproductive rate and are, therefore, evolving more quickly <abbrgrp><abbr bid="B43">43</abbr></abbrgrp>. Although rodent milk proteins may appear more distant from human milk proteins than are bovine milk proteins, whether these differences have functional importance is a matter for future scientific inquiry.</p>
            <fig id="F4">
               <title>
                  <p>Figure 4</p>
               </title>
               <caption>
                  <p>Relationships between the milk protein sequences of mammalian taxa</p>
               </caption>
               <text>
                  <p>Relationships between the milk protein sequences of mammalian taxa. This milk protein consensus tree, which is incongruous with the accepted phylogeny shown in Figure 1, was derived from a super-alignment of milk protein amino acid sequences for those genes with single copy orthologs in all seven species. The numbers indicate the percent of bootstraps that support the internal branch and the length of the scale bar represents the number of amino acid substitutions per unit site.</p>
               </text>
               <graphic file="gb-2009-10-4-r43-4"/>
            </fig>
            <fig id="F5">
               <title>
                  <p>Figure 5</p>
               </title>
               <caption>
                  <p>Pairwise percent identity of human milk proteins with milk proteins of other species</p>
               </caption>
               <text>
                  <p>Pairwise percent identity of human milk proteins with milk proteins of other species. Bars depict the average amino acid (AA) pairwise percent identity between human milk proteins and those of the species named on the x-axis. Note that human milk proteins are more similar to those of dog and bovine than to rodents and the other species depicted.</p>
               </text>
               <graphic file="gb-2009-10-4-r43-5"/>
            </fig>
         </sec>
         <sec>
            <st>
               <p>Conservation of milk and mammary genes in mammals</p>
            </st>
            <p>To determine whether milk and lactation-related genes are more or less conserved across mammals than other genes, average PIDs of the 21 pairwise comparisons of the seven taxa were computed on a genome-wide basis for all bovine consensus gene models and genes from the milk protein and mammary gene sets with single copy orthologs in these taxa (Figure <figr fid="F6">6</figr>). The distribution of the average pairwise PIDs of the milk protein gene set did not significantly differ from the whole genome distribution, nor did the means of the two distributions significantly differ (see 'Statistical analysis of PID distributions' in Materials and methods). However, when the sample size was increased by individually assessing pairwise PIDs between human and each of the other six taxa, requiring in each case that orthologs be single copies only in bovine and the two taxa being compared, milk protein sequences were statistically more conserved between human and other mammals than the products of other genes in the genome (see Additional data file 20 for details). The human-bovine distribution is most dramatically different from the whole genome as a full quarter of the set of the 137 milk protein genes with single copies in these two genomes are very highly conserved with a pairwise PID of 97.5% or greater.</p>
            <fig id="F6">
               <title>
                  <p>Figure 6</p>
               </title>
               <caption>
                  <p>Average pairwise percent identities of milk and mammary genes across mammals</p>
               </caption>
               <text>
                  <p>Average pairwise percent identities of milk and mammary genes across mammals. The distribution of average pairwise PID of amino acid sequences across the seven taxa - human, mouse, rat, bovine, dog, opossum, and platypus - is plotted for those genes in the virgin, pregnancy, lactation, involution, and mastitis mammary gene sets, the milk protein gene set, and all bovine consensus genes. Only genes with a single copy in each of the seven genomes were used for the analysis. Milk and mammary genes are more conserved across mammals than other genes in the genome.</p>
               </text>
               <graphic file="gb-2009-10-4-r43-6"/>
            </fig>
            <p>Of the average pairwise PID distributions of the mammary gene sets in Figure <figr fid="F6">6</figr>, all are significantly different from the genome-wide distribution. The means of their distributions also differ from the genome-wide mean. As a group, mammary genes of every developmental stage and condition appear to be more conserved across Mammalia, on average, than other genes in the genome.</p>
            <p>To discover which milk proteins are most conserved in mammals, the average pairwise PIDs among the seven mammalian taxa were computed for all genes from the milk protein gene set with single copy orthologs in the manually curated set (see 'Curation of milk protein orthologs' in Materials and methods). The top 25 most conserved milk proteins across all seven mammals are listed in Table <tblr tid="T2">2</tblr>. These proteins have greater than 95% identity across mammals, some more than 99%, despite the fact that they have not shared a common ancestor for more than 160 million years. Based on the amino acid length and conservation, we can predict that these milk proteins have a small size with functions that depend on strictly conserved structure.</p>
            <tbl id="T2">
               <title>
                  <p>Table 2</p>
               </title>
               <caption>
                  <p>Highly conserved milk proteins</p>
               </caption>
               <tblbdy cols="4">
                  <r>
                     <c ca="left">
                        <p>Protein name</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN ID*</p>
                     </c>
                     <c ca="left">
                        <p>Gene symbol</p>
                     </c>
                     <c ca="center">
                        <p>Average PID</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Rab 11A</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_20537</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>RAB11A</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>100</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>GTP binding protein G(I)/G(S)/G(T) beta subunit 1</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_21827</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>GBB1</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>100</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>GTP binding regulatory protein beta 2 chain</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_22534</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>GNB2</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>100</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Rho C</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_13128</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>RHOC</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>99.8</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Rab 11B</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_03051</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>RAB11B</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>99.6</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Rap 1b</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_10112</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>RAP1B</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>99.6</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>GTP binding protein Sara</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_16602</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>SAR1A</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>99.5</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Rab 3A</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_02763</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>RAB3A</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>99.5</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Histone 2, H2ab</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_23583</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>HIST2H2AB</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>99.2</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>SAR1B protein</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_08536</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>SAR1B</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>98.9</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>14-3-3 protein beta/alpha</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_04527</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>YWHAB</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>98.9</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Leucine-rich repeat containing protein 8</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_26477</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>LRC8A</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>98.8</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Rab 18</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_21462</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>RAB18</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>98.6</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Rho GDP-dissociation inhibitor 1</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_11194</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>ARHGDIA</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>98.5</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Rab 5C</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_17381</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>RAB5C</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>98.5</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AD158</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_08550</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>LRC8C</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>98.1</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Rab 3C</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_20950_P10949</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>RAB3C</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>98.0</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Eukaryotic translation initiation factor 4, gamma 2</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_19671</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>EIF4G2</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>97.9</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>ATP synthase, H+ transporting, mitochondrial F1 complex, alpha subunit</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_03119</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>ATP5A1</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>97.7</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>ARP3 (actin-related protein 3, yeast) homolog</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_25161</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>ACTR3</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>97.5</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Vimentin</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_20783</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>VIM</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>97.3</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>GTP binding protein alpha 14</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_08781</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>GNA14</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>97.2</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Endoplasmin precursor (GRP94/GP96)</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_20794</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>HSP90B1</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>97.1</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Lymphocyte cytosolic protein 1 (65 K macrophage protein/L-plastin)</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_05236</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>LCP1</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>97.0</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Retinal short-chain dehydrogenase/reductase</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_03662</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>SDR1</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>96.9</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>*Manually curated full-length sequences are indicated by the following accession format: GLEAN_ID_ACCESSION, where ACCESSION is the UniProt accession for the replacement amino acid sequence and GLEAN_ID is the bovine consensus gene identifier for the original sequence.</p>
               </tblfn>
            </tbl>
            <p>Nearly all of the highly conserved milk proteins (Table <tblr tid="T2">2</tblr>) are found in the milk fat globule membrane proteome. GO analysis of these proteins yields four enriched terms: 'GTPase activity,' 'GTP binding,' 'small GTPase mediated signal transduction,' and 'intracellular protein transport.' Twelve of the proteins listed in Table <tblr tid="T2">2</tblr> are annotated with one or more of these GO terms. GTPases are known to be involved in the exocytotic pathway by which proteins are trafficked from the Golgi compartment to the plasma membrane. Further, GBB1 [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_175777">NM_175777</ext-link>], RAB11B [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_001035391">NM_001035391</ext-link>], RAP1B [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_175824">NM_175824</ext-link>], YWHAB [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_174794">NM_174794</ext-link>], and RAB18 [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_001075499">NM_001075499</ext-link>] listed in Table <tblr tid="T2">2</tblr> have previously been isolated in Golgi fractions from the mammary glands of pregnant and lactating rats <abbrgrp><abbr bid="B48">48</abbr></abbrgrp>. An additional four milk proteins, SAR1A [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_001034521">NM_001034521</ext-link>], SAR1B [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_001035315">NM_001035315</ext-link>], RAB3A [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_174446">NM_174446</ext-link>], and RAB3C [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_001046606">NM_001046606</ext-link>], are annotated with the GO term 'secretory pathway.' 
The finding that so many of these secretion-related proteins are associated with the milk fat globule membrane suggests they may also be involved in the highly specialized process by which the milk fat globule is secreted or that the exocytotic and lipid secretion pathways intersect at some point during the secretion process. Because the conserved proteins listed in Table <tblr tid="T2">2</tblr> are related to the generic molecular function of secretion, it seems highly likely that they facilitate the secretion of milk lipid.</p>
            <p>Conservation of mammary genes relative to other genes in the genome suggests hypotheses about the evolution of milk production. First, conservation of mammary genes involved in all developmental stages supports the hypothesis that, at the genetic level, the basic biological transformation of the virgin gland through pregnancy, lactation, and involution is conserved among all mammals, and occurred by co-opting existing structures and developmental pathways. Second, many of the most highly conserved proteins found in milk are constituents of the milk fat globule membrane and are known to be part of the secretory process. High conservation of these genes among platypus, opossum, and the placental mammals indicates that molecular mechanisms of secretion were already in place 160 million years ago.</p>
         </sec>
         <sec>
            <st>
               <p>Divergent milk protein genes in mammals</p>
            </st>
            <p>Because the technique for ortholog detection relies on a minimum threshold of conservation, orthologs of many of the more divergent proteins could not be found in the platypus or opossum genomes. Therefore, to determine which proteins in milk are most divergent in mammals, average PIDs were computed across only the five placental mammals. The 25 most divergent milk proteins across placental mammals are presented in Table <tblr tid="T3">3</tblr>. These milk proteins are primarily secreted or cell-surface proteins with structures that are apparently not constrained by function relative to other proteins in milk. Four GO terms associated with these proteins are enriched: 'pattern binding,' 'response to other organism,' 'inflammatory response,' and 'extracellular space.'</p>
            <tbl id="T3">
               <title>
                  <p>Table 3</p>
               </title>
               <caption>
                  <p>Highly divergent milk proteins</p>
               </caption>
               <tblbdy cols="4">
                  <r>
                     <c ca="left">
                        <p>Protein name</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN ID*</p>
                     </c>
                     <c ca="left">
                        <p>Gene symbol</p>
                     </c>
                     <c ca="center">
                        <p>Average PID</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Alpha-S1-casein</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_22124_P02662</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>CSN1S1</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>44.4</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>G protein Xlalphas</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_10239</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>GNAS</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>48.6</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Kappa casein</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_22128</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>CSN3</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>51.3</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Mucin 1</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_00552</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>MUC1</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>52.2</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Beta casein</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_22133</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>CSN2</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>55.4</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Rab 10</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_18819_A6QLS9</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>RAB10</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>57.6</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>SCAMP2</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_09359_A6QR35</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>SCAMP2</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>63.6</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Fetuin</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_07528</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>AHSG</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>64.5</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Immunoglobulin IgM</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_18189</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>IgM</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>65.0</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Polymeric-immunoglobulin receptor precursor</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_25657</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>PIGR</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>66.7</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Keratin 9</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_21315</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>KRT9</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>66.9</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>CD14</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_04279</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>CD14</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>68.0</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Rab 7</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_25742</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>RAB7A</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>68.3</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Peptidoglycan recognition protein</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_12036</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>PGLYRP1</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>68.5</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Fibrinogen alpha chain</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_24372</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>FGA</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>68.6</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Apolipoprotein B</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_00959</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>APOB</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>69.4</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Apolipoprotein E</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_10715</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>APOE</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>70.0</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Glycoprotein antigen MGP57/53 (lactadherin/bP47 protein)</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_17418</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>MFGE8</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>70.3</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Toll-like receptor 4</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_05263</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>TLR4</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>70.7</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Alpha-lactalbumin</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_17221</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>LALBA</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>70.7</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>MUC15 protein</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_04480</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>MUC15</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>71.0</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Macrophage scavenger receptor types I and II</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_13926</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>MSR1</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>72.1</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Toll-like receptor 2</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_24366</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>TLR2</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>73.1</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Albumin (precursor)</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_11814</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>ALB</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>74.6</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Chitinase-like protein 1 (CLP-1)</p>
                     </c>
                     <c ca="left">
                        <p>GLEAN_07846</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>CHI3L1</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>76.3</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>*Manually curated full-length sequences are indicated by the following accession format: GLEAN_ID_ACCESSION, where ACCESSION is the UniProt accession for the replacement amino acid sequence and GLEAN_ID is the bovine consensus gene identifier for the original sequence.</p>
               </tblfn>
            </tbl>
            <p>The greatest inter-species divergence among milk protein sequences occurs with those proteins that are most abundant in milk (caseins, alpha-lactalbumin (LALBA)), those most abundant in plasma (fetuin, albumin), and with those contributing to immunity. The casein proteins are the most divergent of the milk proteins, with an average pairwise PID of only 44-55% across placental mammals. Nutritionally, the caseins provide the suckling neonate with a source of amino acids and with highly bioavailable calcium. Additionally, peptides derived from partially digested caseins have potential anti-microbial, immune-modulating, and other bioactive properties. The fact that the caseins are the most divergent of the milk proteins suggests that the nutritional and immunological functions of these proteins do not particularly constrain their amino acid sequence and structure.</p>
            <p>The sequence divergence of LALBA is surprising given that it is essential to the synthesis of lactose, the primary source of digestible carbohydrate. <it>LALBA </it>encodes a protein that forms the regulatory subunit of the lactose synthase heterodimer. However, additional functions of LALBA have emerged. When human LALBA is partially unfolded and bound to oleic acid, it functions as an apoptotic factor that kills tumor cells and immature cells, but not healthy differentiated cells <abbrgrp><abbr bid="B49">49</abbr></abbrgrp>. Thus, it is possible that this variant of LALBA protects the gut of the human neonate. Furthermore, the apoptotic capabilities of LALBA appear to be utilized in the regulation of involution of the mammary gland. A recent study suggests that Cape fur seals escape apoptosis and involution of the mammary gland during long foraging trips because they lack the LALBA protein <abbrgrp><abbr bid="B50">50</abbr></abbrgrp>. While lactose synthesis may be a common essential function, it appears that it does not overly constrain the sequence divergence of LALBA. The sequence divergence of LALBA may rather be related to the potential of this protein to modulate species-specific strategies related to immune function and the regulation of the mammary gland.</p>
            <p>The most divergent immune-related proteins in milk are products of the following genes: <it>mucin 1 </it>(<it>MUC1</it>) [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_174115">NM_174115</ext-link>], <it>immunoglobulin IgM </it>[GenBank:<ext-link ext-link-type="gen" ext-link-id="BC114809">BC114809</ext-link>], <it>polymeric-immunoglobulin receptor </it>(<it>PIGR</it>) [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_174143">NM_174143</ext-link>], <it>peptidoglycan recognition protein </it>(<it>PGLYRP1</it>) [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_174573">NM_174573</ext-link>], <it>CD14 </it>[GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_174008">NM_174008</ext-link>], <it>Toll-like receptor 2 </it>(<it>TLR2</it>) [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_174197">NM_174197</ext-link>], <it>Toll-like receptor 4 </it>(<it>TLR4</it>) [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_174198">NM_174198</ext-link>], <it>macrophage scavenger receptor types I and II </it>(<it>MSR1</it>) [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_001113240">NM_001113240</ext-link>], and <it>chitinase-like protein 1 </it>(<it>CHI3L1</it>) [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_001080219">NM_001080219</ext-link>]. In milk, CD14 and TLR2 are present in soluble forms and may neutralize pathogens by binding to them as decoy receptors <abbrgrp><abbr bid="B13">13</abbr><abbr bid="B14">14</abbr></abbrgrp>. MUC1 prevents the binding of pathogenic bacteria to epithelial cells <it>in vitro </it>(R.L. Tellam, personal communication). Our finding that the most divergent milk protein genes are those that confer immunity presumably reflects a flexibility to confront a wide variety of pathogen challenges.</p>
         </sec>
         <sec>
            <st>
               <p>Evolution of milk and mammary genes along the bovine lineage</p>
            </st>
            <p>To investigate the selective constraints on the evolution of bovine milk and mammary genes, the ratio of the rate of non-synonymous substitutions per non-synonymous site (d<sub>N</sub>) to the rate of synonymous substitutions per synonymous site (d<sub>S</sub>) was estimated for proteins in each gene set using bovine genes and their putative orthologs in the human and mouse genomes (see 'Evolutionary analysis along the bovine lineage' in Materials and methods for details). The average d<sub>N</sub>/d<sub>S </sub>ratio of the genes from the milk protein and mammary gene sets (Table <tblr tid="T4">4</tblr>) was significantly below the genome average (Mann-Whitney U test, <it>P </it>&lt; 0.05), indicating that milk and mammary genes are subject to more stringent selective constraint than other genes in the bovine genome.</p>
            <tbl id="T4">
               <title>
                  <p>Table 4</p>
               </title>
               <caption>
                  <p>Milk and mammary gene average d<sub>N</sub>/d<sub>S</sub></p>
               </caption>
               <tblbdy cols="3">
                  <r>
                     <c ca="left">
                        <p>Gene set</p>
                     </c>
                     <c ca="center">
                        <p>Number of genes with computed d<sub>N</sub>/d<sub>S</sub></p>
                     </c>
                     <c ca="center">
                        <p>Average d<sub>N</sub>/d<sub>S</sub></p>
                     </c>
                  </r>
                  <r>
                     <c cspan="3">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Milk protein</p>
                     </c>
                     <c ca="center">
                        <p>149</p>
                     </c>
                     <c ca="center">
                        <p>0.13</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Virgin mammary</p>
                     </c>
                     <c ca="center">
                        <p>3,091</p>
                     </c>
                     <c ca="center">
                        <p>0.13</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Pregnancy mammary</p>
                     </c>
                     <c ca="center">
                        <p>1,032</p>
                     </c>
                     <c ca="center">
                        <p>0.12</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Lactation mammary</p>
                     </c>
                     <c ca="center">
                        <p>2,477</p>
                     </c>
                     <c ca="center">
                        <p>0.12</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Involution mammary</p>
                     </c>
                     <c ca="center">
                        <p>704</p>
                     </c>
                     <c ca="center">
                        <p>0.12</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Mastitis mammary</p>
                     </c>
                     <c ca="center">
                        <p>615</p>
                     </c>
                     <c ca="center">
                        <p>0.12</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Whole genome</p>
                     </c>
                     <c ca="center">
                        <p>14,354</p>
                     </c>
                     <c ca="center">
                        <p>0.16</p>
                     </c>
                  </r>
               </tblbdy>
            </tbl>
            <p>Given the taxonomic diversity of milk composition, we expected that the processes of lactation would be under stronger selective pressure than the genes that give rise to proteins in milk. However, the average d<sub>N</sub>/d<sub>S </sub>of the milk protein gene set was similar to that of the lactation mammary gene set (Table <tblr tid="T4">4</tblr>). This result suggests that species-specific variation in milk composition is primarily due to mechanisms other than milk and mammary protein sequence variation.</p>
            <p>Next, milk and mammary genes were evaluated for positive selection. A gene is inferred to be subject to positive selection when d<sub>N</sub>/d<sub>S </sub>is significantly greater than 1. Of the 6,530 genes from the milk protein and mammary gene sets, only two bovine genes with d<sub>N</sub>/d<sub>S </sub>>1 were significant under the likelihood ratio test (see 'Evolution analysis along the bovine lineage' in Materials and methods): <it>ADP-ribosyltransferase 4 </it>(<it>ART4</it>) [GenBank:<ext-link ext-link-type="gen" ext-link-id="AJ291442">AJ291442</ext-link>] and <it>prenylcysteine oxidase 1 </it>(<it>PCYOX1</it>) [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_001105474">NM_001105474</ext-link>]. The <it>ART4 </it>gene product, which has previously been reported to be subject to positive selection in cattle <abbrgrp><abbr bid="B51">51</abbr></abbrgrp>, is an erythrocyte protein that carries antigens to the Dombrock blood group. <it>PCYOX1 </it>produces a protein that degrades a variety of prenylcysteines. Using RT-PCR to determine <it>PCYOX1 </it>and <it>ART4 </it>mRNA levels in alveolar mammary tissue from virgin, prepartum, lactating, involuting and dried-off cows (Additional data file 22), we found that <it>PCYOX1 </it>and <it>ART4 </it>are not differentially expressed in these tissues. The accelerated evolution of these genes may be unrelated to mammary biology.</p>
            <p>Two abundant milk protein genes, <it>beta-casein </it>(<it>CSN2</it>) [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_181008">NM_181008</ext-link>] and <it>kappa-casein </it>(<it>CSN3</it>) [GenBank:<ext-link ext-link-type="gen" ext-link-id="NM_174294">NM_174294</ext-link>], were among those with d<sub>N</sub>/d<sub>S </sub>>1, but they were not statistically significant under the likelihood ratio test (see 'Evolution analysis along the bovine lineage' in Materials and methods). The requirement that the entire gene shows statistical evidence of positive selection may be too stringent. Evidence of positive selection within the family Bovidae has been previously detected in a 34-codon region of <it>CSN3 </it><abbrgrp><abbr bid="B52">52</abbr></abbrgrp>. Further site-specific evolutionary analysis of the casein genes may be warranted.</p>
            <p>Despite the domestication of cattle for milk production, breeding regimes have not caused the apparent accelerated evolution of even a single milk protein or member of the lactation mammary gene set. Furthermore, milk and mammary genes are undergoing stronger purifying selection than other genes in the bovine genome. It has previously been theorized that the evolution of the mammary gland has been subject to forces that maximize the survival of the mother-child pair <abbrgrp><abbr bid="B53">53</abbr></abbrgrp>. Because all components in the milk are produced at the expense of the mother, it can be argued that few superfluous components would survive evolution. Our findings are consistent with this hypothesis. Genes encoding milk components and other genes expressed in the mammary gland were found to be under significant negative selection compared to the whole genome, highlighting the essentiality of milk in mammalian evolution.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Conclusions</p>
         </st>
         <p>The availability of the <it>B. taurus </it>genome sequence assembly marks the beginning of a new era for the study of milk and mammary biology. Using this assembly, we identified 197 unique milk protein genes and over 6,000 mammary-related genes distributed across all bovine chromosomes. Intersecting these genes with 238 curated milk-trait QTL, we reduced the search space for milk trait effectors by more than an order of magnitude.</p>
         <p>Comparing genes of seven mammalian species, we found that more milk and mammary genes are present in all mammals and more were duplicated after the common ancestor with platypus than other genes in the bovine genome. We also found that, on average, milk and mammary genes are more conserved than other genes among mammals and are evolving more slowly than other genes in the bovine genome. The higher conservation of these genes, as well as the strong negative selection and absence of positive selection, supports the hypothesis that the evolution of milk has been constrained to maximize the survival of both mother and offspring.</p>
         <p>Our findings also suggest that the species-specific variation in milk composition is primarily due to mechanisms other than protein sequence variation. Variation in copy number of the milk protein genes may contribute to the taxonomic diversity of milk composition, as exemplified by duplications of some immune-related milk proteins. Additional mechanisms, such as transcriptional and translational regulation of genes expressed in the mammary gland as well as other organs involved in energy partitioning may be larger contributors to milk composition variation. In future studies, non-coding regions of the genome, particularly those with putative regulatory function, will need to be explored as potential sources of species-specific variation in milk composition.</p>
         <p>We found that mammary genes are co-localized in the bovine genome, implying co-regulation of expression in mammary epithelial cells. Our study of the most complete milk proteome to date demonstrates that milk proteins do not generally cluster with each other, but do cluster with mammary genes, and therefore are likely co-regulated. The casein proteins are therefore unique among the milk protein genes in both their divergence between species and in their genomic organization.</p>
         <p>Across the seven mammalian genomes, we found that the most divergent milk proteins are known to have nutritional and immunological properties, whereas the most conserved are within the milk fat globule proteome. The high conservation of genes apparently involved in milk fat globule secretion suggests that the cellular anatomy of secretion may be conserved across species and likely shared among secretory organs. Likewise, the higher conservation of mammary genes, compared with other genes, suggests that the ontogeny of the mammary gland occurred by co-opting existing structures and developmental pathways. Lactation may be less than 200 million years old, but its biological roots are far more ancient.</p>
      </sec>
      <sec>
         <st>
            <p>Materials and methods</p>
         </st>
         <sec>
            <st>
               <p>Collection of the milk protein gene set</p>
            </st>
            <p>Amino acid sequences corresponding to the protein identifiers reported in two proteomic studies <abbrgrp><abbr bid="B11">11</abbr><abbr bid="B12">12</abbr></abbrgrp> were collected from SwissProt, UniRef, TREMBL, and NCBI databases. A custom track of the bovine consensus gene models <abbrgrp><abbr bid="B43">43</abbr></abbrgrp>, or 'GLEAN' models, was created and uploaded to the University of California Santa Cruz (UCSC) Genome Browser <abbrgrp><abbr bid="B54">54</abbr></abbrgrp>. The milk protein amino acid sequences were aligned against the bovine genome draft 3.1, also known as 'Aug. 2006,' using BLAT <abbrgrp><abbr bid="B55">55</abbr></abbrgrp>. The best scoring hits were manually reviewed against the custom GLEAN track in the UCSC Genome Browser. From the protein sequence identifiers in the Smolenski and Reinhardt studies <abbrgrp><abbr bid="B11">11</abbr><abbr bid="B12">12</abbr></abbrgrp>, 189 unique milk proteins were mapped to GLEAN IDs. The GLEAN IDs corresponding to the six most abundant milk proteins, alpha-S1-casein, alpha-S2-casein, beta-casein, kappa-casein, LGB, and LALBA, were also added to this gene set. Additionally, a script was written to identify genes in the bovine annotation database annotated by the lactation group that did not already exist in our milk protein gene set. Those genes were then manually screened for proteins known to be in milk. Two additional proteins were identified: lactotransferrin and secreted phosphoprotein 1 (osteopontin). In total, the milk protein gene set consists of 197 unique genes that encode proteins known to be in bovine milk (Additional data files 1 and 2).</p>
         </sec>
         <sec>
            <st>
               <p>Collection of the mammary gene sets</p>
            </st>
            <p>Bovine mammary gland EST libraries available through the NCBI EST database <abbrgrp><abbr bid="B56">56</abbr></abbrgrp> were surveyed to define condition- or developmental stage-specific mammary gene sets. Descriptions of the EST libraries used as well as reasons for exclusion of other EST libraries are given in Additional data file 21. The EST libraries used include the BMGA, BMLB, BMPA, BMUA, and BMVB libraries developed by AgResearch Ltd and Genesis Ltd in New Zealand as well as the FNM and FLM libraries developed by ViaLactia Biosciences Ltd in New Zealand. Custom tracks for the UCSC Genome and Table Browsers <abbrgrp><abbr bid="B54">54</abbr><abbr bid="B57">57</abbr></abbrgrp> were created for all GLEAN models from the bovine genome project <abbrgrp><abbr bid="B43">43</abbr></abbrgrp> and for all of these EST libraries. The intersection filter of the UCSC Table Browser was used to identify the GLEAN models that overlapped with ESTs in these libraries. Mammary gene sets were defined as follows: virgin = (BMVB or FNM); pregnancy = BMPA; lactation = (BMGA or FLM); involution = BMLB; and mastitis = BMUA. In total, these mammary gene sets contain 6,469 unique genes derived from over 94,000 ESTs. Gene identifiers for the genes that comprise each mammary gene set are given in the spreadsheets of Additional data file 1. UCSC custom tracks of these gene sets are provided in Additional data files 3-7.</p>
         </sec>
         <sec>
            <st>
               <p>Gene Ontology analysis</p>
            </st>
            <p>Bovine genes from the milk protein and mammary gene sets were mapped to human orthologs using a three-way reciprocal best BLAST hit approach between human, mouse, and bovine as implemented in the 'Ortholuge' program <abbrgrp><abbr bid="B58">58</abbr></abbrgrp>. Using GO-Elite version 1.17 beta <abbrgrp><abbr bid="B59">59</abbr></abbrgrp>, the human orthologs of milk and mammary genes were analyzed for over-represented GO terms compared with the full set of human orthologs. GO-Elite calculates a Fisher's exact test z-score for unique genes corresponding to a GO term from the user's input list compared with the reference list. To calculate a <it>P</it>-value for each GO term, GO-Elite randomly selects the same number of input genes or probe sets in the user's input gene list from the reference list 2,000 times to determine the likelihood of obtaining a z-score greater than or equal to the empirically derived z-score. To adjust for multiple hypothesis testing, the Benjamini-Hochberg correction is used to calculate an adjusted <it>P</it>-value. GO-Elite determines the set of minimally redundant significant GO terms by examining the scores and relative positions of all high-scoring terms within the hierarchy to select those terms that maximally describe the biology without removing valuable information. GO terms with an adjusted <it>P</it>-value &#8804; 0.05 were taken to be significant.</p>
         </sec>
         <sec>
            <st>
               <p>Pathway analysis</p>
            </st>
            <p>Ingenuity Pathways Analysis <abbrgrp><abbr bid="B60">60</abbr></abbrgrp> was used to identify metabolic and signaling pathways that are over-represented by the human orthologs of milk and lactation-related bovine genes compared with the human orthologs of all of the genes from the bovine consensus gene model (GLEAN) set. The Ingenuity Pathways Analysis library of canonical pathways includes 80 metabolic and 72 signaling pathways that have been incorporated from various resources and hand-curated. A Fisher's exact test was used to calculate a <it>P</it>-value to determine the probability that the enrichment of the canonical pathway with the gene set of interest is explained by chance alone. In this paper, this <it>P</it>-value is referred to as the unadjusted <it>P</it>-value. Enriched pathways with an unadjusted <it>P</it>-value &#8804; 0.05 and associated with at least three genes of interest are referred to as marginally significant. To improve the stringency of the test, a Benjamini and Hochberg multiple testing correction was applied to the unadjusted <it>P</it>-values with a custom R script using the multtest library <abbrgrp><abbr bid="B61">61</abbr><abbr bid="B62">62</abbr></abbrgrp>. Pathways reported to be statistically significant were those with a Benjamini and Hochberg adjusted <it>P</it>-value &#8804; 0.05.</p>
         </sec>
         <sec>
            <st>
               <p>Genomic localization analysis</p>
            </st>
            <p>The bovine genome was explored for clusters of milk and lactation-related genes that are more proximal to each other in the genome than would be expected by chance. Using the method developed by Salomonis <it>et al</it>. <abbrgrp><abbr bid="B63">63</abbr></abbrgrp>, 500 kb windows on the genome that start in the same position as a gene were tested as candidate co-location clusters. For each such candidate cluster, a list of genes that overlap the window was assembled. Strand information was ignored, so that a gene was considered to start at its lowest coordinate. Genomic sequence not assembled to chromosomes was excluded.</p>
            <p>For each of the milk protein and mammary gene sets, the statistically expected number of genes from the cluster in the gene set was calculated, given the number of genes on chromosomes both inside and outside of the gene set and using a hypergeometric distribution. Genes were considered to comprise a co-location cluster if there were at least three non-paralogous genes of interest in the region and the number of candidate cluster genes from the gene sets was significantly higher than chance (<it>P </it>&#8804; 0.05). A multiple test correction against all the clusters was performed with a Benjamini and Hochberg false discovery rate <abbrgrp><abbr bid="B61">61</abbr><abbr bid="B62">62</abbr></abbrgrp>. When multiple clusters contained the same genes or subsets of genes, the cluster with the lowest <it>P</it>-value was reported.</p>
         </sec>
         <sec>
            <st>
               <p>Orthology delineation</p>
            </st>
            <p>Orthologs of the milk and mammary genes were filtered from the whole genome ortholog set <abbrgrp><abbr bid="B43">43</abbr></abbrgrp>. Briefly, groups of orthologous genes were automatically identified using a previously employed strategy <abbrgrp><abbr bid="B64">64</abbr></abbrgrp> that is based on all-against-all protein sequence comparisons using the Smith-Waterman algorithm, followed by clustering of best reciprocal hits from highest scoring ones to 10<sup>-3 </sup>e-value cutoff for triangulating best reciprocal hits or 10<sup>-6 </sup>cutoff for unsupported best reciprocal hits, and requiring a sequence alignment overlap of at least 30 amino acids across all members of a group. Furthermore, the orthologous groups were expanded by genes that are more similar to each other within a proteome than to any gene in any of the other species, and by very similar copies that share over 97% sequence identity. The procedure was applied to the initial bovine set of consensus gene models <abbrgrp><abbr bid="B43">43</abbr></abbrgrp> and to the longest transcript per gene of the Ensembl v.45 <abbrgrp><abbr bid="B65">65</abbr></abbrgrp> gene sets of human, mouse, rat, dog, opossum, and platypus.</p>
         </sec>
         <sec>
            <st>
               <p>Curation of milk protein orthologs</p>
            </st>
            <p>Orthologs of milk protein genes (see 'Orthology delineation' above) were curated manually if they were uniquely duplicated in <it>B. taurus </it>or missing copies in one or more of the placental mammals. Fifteen genes uniquely duplicated in <it>B. taurus </it>were removed from the curated ortholog set for the following reasons: four were pseudogenes - gene duplicates without introns; four were not assembled on a chromosome and, therefore, likely to represent reading of the same sequence; and seven were a result of an assembly error or poor GLEAN prediction. The pseudogenes identified were those of PFN1 (GLEAN_02143), RAB18 (GLEAN_21462), RAP1B (GLEAN_10112), and YWHAZ (GLEAN_11922). A perfect duplicate of GAPDH (GLEAN_13969) that exists in both Btau 3.1 and 4.0 assemblies was retained, but further research is needed to determine if it is a true expansion. To find missing orthologs of milk protein genes in placental mammals, the Ensembl databases of those species with orthologs not found by automated detection were searched using BLAST and the bovine consensus gene and protein sequences. Additional known orthologs were collected from UniProt. In total, 15 erroneous duplicate genes and 37 missing orthologs were identified through manual curation. This curated ortholog set is available in Additional data file 19.</p>
            <p>For conservation analyses, amino acid sequences of bovine genes annotated as erroneous in the bovine genome annotation database <abbrgrp><abbr bid="B66">66</abbr></abbrgrp> were replaced with manually curated full-length sequences from UniProt <abbrgrp><abbr bid="B67">67</abbr></abbrgrp>. Replaced sequences are indicated by the following accession format in Tables <tblr tid="T2">2</tblr> and <tblr tid="T3">3</tblr>: GLEAN_ID_ACCESSION where ACCESSION is the UniProt accession for the replacement amino acid sequence and GLEAN_ID is the bovine gene model identifier for the original sequence.</p>
         </sec>
         <sec>
            <st>
               <p>Milk protein gene copy clustering and visualization</p>
            </st>
            <p>Perl and shell scripts were written to create input files for the clustering tool, Cluster version 2.20 <abbrgrp><abbr bid="B68">68</abbr></abbrgrp>. A K-means clustering algorithm was applied in Cluster, and the resulting clusters were seriated using a multiple-fragment heuristic in PermutMatrix <abbrgrp><abbr bid="B69">69</abbr></abbrgrp>. Whether or not clustering was applied, all heatmaps were seriated and visualized in PermutMatrix.</p>
         </sec>
         <sec>
            <st>
               <p>Consensus tree construction</p>
            </st>
            <p>Single copy ortholog identifiers of milk protein genes were extracted from the whole genome set of orthologous clusters (see 'Orthology delineation' in Materials and methods). Amino acid sequences for these identifiers were downloaded from the Ensembl database release 45 <abbrgrp><abbr bid="B70">70</abbr></abbrgrp>. Multiple alignments of the milk proteins were constructed using MUSCLE <abbrgrp><abbr bid="B71">71</abbr></abbrgrp>. The multiple alignments were then concatenated into a super-alignment that was used to create a maximum likelihood consensus tree with PhyML <abbrgrp><abbr bid="B72">72</abbr><abbr bid="B73">73</abbr></abbrgrp>. The tree was constructed based on the JTT model of amino acid sequence evolution <abbrgrp><abbr bid="B74">74</abbr></abbrgrp> with rates assumed to vary among sites according to a gamma distribution. Support for the tree's nodes is given by 100 bootstraps.</p>
         </sec>
         <sec>
            <st>
               <p>Statistical analysis of PID distributions</p>
            </st>
            <p>A Wilcoxon rank sum test with continuity correction (Mann-Whitney U) from the R programming language was used to determine if the mean of the average PIDs across the seven taxa of each milk and lactation gene set is statistically different from the whole genome. A two-sample Kolmogorov-Smirnov test was used to determine if the average PIDs of milk and mammary genes are drawn from the same distribution as the genome. Significance was determined by a <it>P</it>-value &#8804; 0.05.</p>
         </sec>
         <sec>
            <st>
               <p>Evolution analysis along the bovine lineage</p>
            </st>
            <p>For this analysis only, putative orthology was assigned using a three-way reciprocal best BLAST hit approach as implemented in the 'Ortholuge' program <abbrgrp><abbr bid="B58">58</abbr></abbrgrp>. Ortholog sequences for the caseins and alpha-lactalbumin were manually curated. For each gene, d<sub>N</sub>/d<sub>S </sub>ratios were estimated from coding sequence alignments of the human-mouse-bovine orthologs by maximum likelihood using the codeml program from PAMLv4 <abbrgrp><abbr bid="B75">75</abbr></abbrgrp>. Two models were implemented to test the statistical significance of variable selective pressures on each lineage. Under the one-ratio model, which acts as the null model (NSsites = 0, model = 0), each lineage was modeled to have the same d<sub>N</sub>/d<sub>S </sub>ratio. The ratio is constrained between 0 and 1, and does not allow for the presence of positive selection. The second model is a model of bovine-specific evolution, where the bovine lineage was selected as the 'foreground' lineage and d<sub>N</sub>/d<sub>S </sub>was specifically allowed to vary unconstrained on this lineage (model = 2). The two models were compared by likelihood ratio test, calculated from the log likelihood (lnL) values of both models. Twice the difference between lnL<sub>model 2 </sub>and lnL<sub>one-ratio </sub>was compared with a chi-square distribution to obtain the <it>P</it>-values.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Abbreviations</p>
         </st>
         <p>d<sub>N</sub>: rate of non-synonymous substitutions per non-synonymous site; d<sub>S</sub>: rate of synonymous substitutions per synonymous site; EST: expressed sequence tag; LALBA: alpha-lactalbumin; LGB: beta-lactoglobulin; GO: Gene Ontology; PAEP: progestagen-associated endometrial protein; PID: percent identity; QTL: quantitative trait loci; UCSC: University of California at Santa Cruz.</p>
      </sec>
      <sec>
         <st>
            <p>Authors' contributions</p>
         </st>
         <p>DGL and MR conceived of the study and participated in its design and coordination. DJL conducted evolutionary analyses. WFM and DGL performed genome localization analyses. EMZ and EVK provided orthology delineation. DGL, EVK, and NJM conducted phylogenetic experiments. JFM and GR curated milk protein orthologs and milk trait QTL. WCB produced the chromosome map. ASH created custom tracks for the UCSC Genome Browser. KS and RM conducted RT-PCR assays and prepared Additional data file 22. DGL produced the milk and mammary gene lists and conducted all other analyses. KSP supervised statistical analyses. DGL, TMC, MCN, AJM, RLT, and MR interpreted data. DGL, TMC, MCN, and MR drafted the manuscript. All authors contributed to and approved the final manuscript.</p>
      </sec>
      <sec>
         <st>
            <p>Additional data files</p>
         </st>
         <p>The following additional data are available with the online version of this paper. Additional data file <supplr sid="S1">1</supplr> is an Excel file with one spreadsheet listing the genes in each of the milk and mammary gene sets and their annotations. Additional data file <supplr sid="S2">2</supplr> is a custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1, that lists the genome locations of the milk protein gene set. Additional data file <supplr sid="S3">3</supplr> is a custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1, that lists the genome locations of the virgin mammary gene set. Additional data file <supplr sid="S4">4</supplr> is a custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1, that lists the genome locations of the pregnancy mammary gene set. Additional data file <supplr sid="S5">5</supplr> is a custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1, that lists the genome locations of the lactation mammary gene set. Additional data file <supplr sid="S6">6</supplr> is a custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1, that lists the genome locations of the involution mammary gene set. Additional data file <supplr sid="S7">7</supplr> is a custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1, that lists the genome locations of the mastitis mammary gene set. Additional data file <supplr sid="S8">8</supplr> is an Excel file that lists genomic locations of curated milk trait QTL. Additional data file <supplr sid="S9">9</supplr> is a custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1, that lists genomic locations of curated milk trait QTL. Additional data file <supplr sid="S10">10</supplr> is a Word document that provides additional analysis and discussion of milk trait QTL density. 
Additional data file <supplr sid="S11">11</supplr> is an Excel file that lists candidate genes that occur within QTL with one spreadsheet per milk trait. Additional data file <supplr sid="S12">12</supplr> is a custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1, that lists genomic locations of candidate genes associated with the 'fat percentage' trait. Additional data file <supplr sid="S13">13</supplr> is a custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1, that lists genomic locations of candidate genes associated with the 'fat yield' trait. Additional data file <supplr sid="S14">14</supplr> is a custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1, that lists genomic locations of candidate genes associated with the 'milk yield' trait. Additional data file <supplr sid="S15">15</supplr> is a custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1, that lists genomic locations of candidate genes associated with the 'protein percentage' trait. Additional data file <supplr sid="S16">16</supplr> is a custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1, that lists genomic locations of candidate genes associated with the 'protein yield' trait. Additional data file <supplr sid="S17">17</supplr> is an Excel file that lists the significant genomic clusters within each milk and mammary gene set. Additional data file <supplr sid="S18">18</supplr> is a custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1, that lists the genome locations of the significant genomic clusters. Additional data file <supplr sid="S19">19</supplr> is an Excel file that lists accession numbers of mammalian orthologs of bovine milk protein genes. Additional data file <supplr sid="S20">20</supplr> is a Word document that provides more detail on the conservation of milk protein genes in mammals. 
Additional data file <supplr sid="S21">21</supplr> is an Excel spreadsheet that lists the EST libraries that were surveyed for this study, the number of ESTs in each library, a description of the physiological state of the animal and tissue used to derive the library, and, if the library was excluded from this study, the reason for exclusion. Additional data file <supplr sid="S22">22</supplr> is a Word document that details the methods used to probe relative mRNA levels of <it>LGB-II</it>, <it>PCYOX1</it>, and <it>ART4 </it>in bovine mammary tissue at different stages of development and the RT-PCR results.</p>
         <suppl id="S1">
            <title>
               <p>Additional data file 1</p>
            </title>
            <caption>
               <p>Milk and mammary gene sets</p>
            </caption>
            <text>
               <p>Milk and mammary gene sets.</p>
            </text>
            <file name="gb-2009-10-4-r43-S1.xls">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S2">
            <title>
               <p>Additional data file 2</p>
            </title>
            <caption>
               <p>Genome locations of milk protein gene set</p>
            </caption>
            <text>
               <p>Custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1.</p>
            </text>
            <file name="gb-2009-10-4-r43-S2.bed">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S3">
            <title>
               <p>Additional data file 3</p>
            </title>
            <caption>
               <p>Genome locations of virgin mammary gene set</p>
            </caption>
            <text>
               <p>Custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1.</p>
            </text>
            <file name="gb-2009-10-4-r43-S3.bed">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S4">
            <title>
               <p>Additional data file 4</p>
            </title>
            <caption>
               <p>Genome locations of pregnancy mammary gene set</p>
            </caption>
            <text>
               <p>Custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1.</p>
            </text>
            <file name="gb-2009-10-4-r43-S4.bed">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S5">
            <title>
               <p>Additional data file 5</p>
            </title>
            <caption>
               <p>Genome locations of lactation mammary gene set</p>
            </caption>
            <text>
               <p>Custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1.</p>
            </text>
            <file name="gb-2009-10-4-r43-S5.bed">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S6">
            <title>
               <p>Additional data file 6</p>
            </title>
            <caption>
               <p>Genome locations of involution mammary gene set</p>
            </caption>
            <text>
               <p>Custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1.</p>
            </text>
            <file name="gb-2009-10-4-r43-S6.bed">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S7">
            <title>
               <p>Additional data file 7</p>
            </title>
            <caption>
               <p>Genome locations of mastitis mammary gene set</p>
            </caption>
            <text>
               <p>Custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1.</p>
            </text>
            <file name="gb-2009-10-4-r43-S7.bed">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S8">
            <title>
               <p>Additional data file 8</p>
            </title>
            <caption>
               <p>Curated milk trait QTL</p>
            </caption>
            <text>
               <p>Genomic locations of curated milk trait QTL.</p>
            </text>
            <file name="gb-2009-10-4-r43-S8.xls">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S9">
            <title>
               <p>Additional data file 9</p>
            </title>
            <caption>
               <p>Genomic locations of milk trait QTL</p>
            </caption>
            <text>
               <p>Custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1.</p>
            </text>
            <file name="gb-2009-10-4-r43-S9.bed">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S10">
            <title>
               <p>Additional data file 10</p>
            </title>
            <caption>
               <p>Milk trait QTL density</p>
            </caption>
            <text>
               <p>Additional analysis and discussion of milk trait QTL density.</p>
            </text>
            <file name="gb-2009-10-4-r43-S10.doc">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S11">
            <title>
               <p>Additional data file 11</p>
            </title>
            <caption>
               <p>Milk trait candidate genes</p>
            </caption>
            <text>
               <p>Candidate genes that occur within QTL with one spreadsheet per milk trait.</p>
            </text>
            <file name="gb-2009-10-4-r43-S11.xls">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S12">
            <title>
               <p>Additional data file 12</p>
            </title>
            <caption>
               <p>Genomic locations of 'fat percentage' candidate genes</p>
            </caption>
            <text>
               <p>Custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1.</p>
            </text>
            <file name="gb-2009-10-4-r43-S12.bed">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S13">
            <title>
               <p>Additional data file 13</p>
            </title>
            <caption>
               <p>Genomic locations of 'fat yield' candidate genes</p>
            </caption>
            <text>
               <p>Custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1.</p>
            </text>
            <file name="gb-2009-10-4-r43-S13.bed">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S14">
            <title>
               <p>Additional data file 14</p>
            </title>
            <caption>
               <p>Genomic locations of 'milk yield' candidate genes</p>
            </caption>
            <text>
               <p>Custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1.</p>
            </text>
            <file name="gb-2009-10-4-r43-S14.bed">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S15">
            <title>
               <p>Additional data file 15</p>
            </title>
            <caption>
               <p>Genomic locations of 'protein percentage' candidate genes</p>
            </caption>
            <text>
               <p>Custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1.</p>
            </text>
            <file name="gb-2009-10-4-r43-S15.bed">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S16">
            <title>
               <p>Additional data file 16</p>
            </title>
            <caption>
               <p>Genomic locations of 'protein yield' candidate genes</p>
            </caption>
            <text>
               <p>Custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1.</p>
            </text>
            <file name="gb-2009-10-4-r43-S16.bed">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S17">
            <title>
               <p>Additional data file 17</p>
            </title>
            <caption>
               <p>Milk and mammary genes co-located in the genome</p>
            </caption>
            <text>
               <p>Significant genomic clusters within each milk and mammary gene set.</p>
            </text>
            <file name="gb-2009-10-4-r43-S17.xls">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S18">
            <title>
               <p>Additional data file 18</p>
            </title>
            <caption>
               <p>Genomic locations of co-located milk and mammary genes</p>
            </caption>
            <text>
               <p>Custom track in BED format for the UCSC Genome Browser, bovine assembly 3.1.</p>
            </text>
            <file name="gb-2009-10-4-r43-S18.bed">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S19">
            <title>
               <p>Additional data file 19</p>
            </title>
            <caption>
               <p>Mammalian orthologs of bovine milk protein genes</p>
            </caption>
            <text>
               <p>Accession numbers of mammalian orthologs of bovine milk protein genes.</p>
            </text>
            <file name="gb-2009-10-4-r43-S19.xls">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S20">
            <title>
               <p>Additional data file 20</p>
            </title>
            <caption>
               <p>Conservation of milk protein genes in mammals</p>
            </caption>
            <text>
               <p>More detail on the conservation of milk protein genes in mammals.</p>
            </text>
            <file name="gb-2009-10-4-r43-S20.doc">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S21">
            <title>
               <p>Additional data file 21</p>
            </title>
            <caption>
               <p>EST library descriptions</p>
            </caption>
            <text>
               <p>EST libraries that were surveyed for this study, the number of ESTs in each library, a description of the physiological state of the animal and tissue used to derive the library, and, if the library was excluded from this study, the reason for exclusion.</p>
            </text>
            <file name="gb-2009-10-4-r43-S21.xls">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S22">
            <title>
               <p>Additional data file 22</p>
            </title>
            <caption>
               <p>RT-PCR methods and results</p>
            </caption>
            <text>
               <p>Methods used to probe relative mRNA levels of <it>LGB-II</it>, <it>PCYOX1</it>, and <it>ART4</it> in bovine mammary tissue at different stages of development and the RT-PCR results.</p>
            </text>
            <file name="gb-2009-10-4-r43-S22.doc">
               <p>Click here for file</p>
            </file>
         </suppl>
      </sec>
   </bdy>
   <bm>
      <ack>
         <sec>
            <st>
               <p>Acknowledgements</p>
            </st>
            <p>The authors acknowledge Cora J Dillard for editorial assistance with the manuscript, David Adelson for providing milk trait QTL from the Bovine QTL viewer, and Chris Elsik for providing the bovine consensus gene model (GLEAN) sequences. The authors would also like to acknowledge Tom Wheeler, Timothy Reinhardt, and W James Kent for helpful comments. DGL, WFM, and JBG are supported by the International Milk Genomics Consortium, NIEHS Superfund grant P42 ES04699, and by the CHARGE study grant P01 ES11269. MR is funded by the USDA Agricultural Research Service 6250-51000-048. MCN is supported by NIH P01-HD38129 to MCN. AJM, NJM, KS, and RM are funded by the Foundation for Research Science and Technology from the New Zealand Government. JFM and GR are supported by the California Dairy Research Foundation Project No. 05 MEJ-01-NH to JFM. ASH is supported by the National Human Genome Research Institute 2 P41 HG002371-06. DJL is funded by Genome Canada and Genome BC through the Pathogenomics of Innate Immunity (PI2) project and holds a Postdoctoral Trainee Award from the Michael Smith Foundation for Health Research. EMZ and EVK are supported by the Swiss National Science Foundation 3100A0-112588. RLT is supported by Australia's Cooperative Research Centre for Innovative Dairy Products and the Gardiner Foundation.</p>
         </sec>
      </ack>
      <refgrp>
         <bibl id="B1">
            <title>
               <p>The mammary gland and its origin during synapsid evolution.</p>
            </title>
            <aug>
               <au>
                  <snm>Oftedal</snm>
                  <fnm>OT</fnm>
               </au>
            </aug>
            <source>J Mammary Gland Biol Neoplasia</source>
            <pubdate>2002</pubdate>
            <volume>7</volume>
            <fpage>225</fpage>
            <lpage>252</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">12751889</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B2">
            <title>
               <p>The delayed rise of present-day mammals.</p>
            </title>
            <aug>
               <au>
                  <snm>Bininda-Emonds</snm>
                  <fnm>ORP</fnm>
               </au>
               <au>
                  <snm>Cardillo</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Jones</snm>
                  <fnm>KE</fnm>
               </au>
               <au>
                  <snm>MacPhee</snm>
                  <fnm>RDE</fnm>
               </au>
               <au>
                  <snm>Beck</snm>
                  <fnm>RMD</fnm>
               </au>
               <au>
                  <snm>Grenyer</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Price</snm>
                  <fnm>SA</fnm>
               </au>
               <au>
                  <snm>Vos</snm>
                  <fnm>RA</fnm>
               </au>
               <au>
                  <snm>Gittleman</snm>
                  <fnm>JL</fnm>
               </au>
               <au>
                  <snm>Purvis</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2007</pubdate>
            <volume>446</volume>
            <fpage>507</fpage>
            <lpage>512</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">17392779</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B3">
            <title>
               <p>Characterizing the chromosomes of the platypus (<it>Ornithorhynchus anatinus</it>).</p>
            </title>
            <aug>
               <au>
                  <snm>McMillan</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Miethke</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Alsop</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Rens</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>O'Brien</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Trifonov</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Veyrunes</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Schatzkamer</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Kremitzki</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Graves</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Warren</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Gr&#252;tzner</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Ferguson-Smith</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Graves</snm>
                  <fnm>JA</fnm>
               </au>
            </aug>
            <source>Chromosome Res</source>
            <pubdate>2007</pubdate>
            <volume>15</volume>
            <fpage>961</fpage>
            <lpage>974</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">18185982</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B4">
            <aug>
               <au>
                  <snm>Grant</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>The Platypus: A Unique Mammal</source>
            <publisher>Sydney, Australia: UNSW Press</publisher>
            <pubdate>1995</pubdate>
         </bibl>
         <bibl id="B5">
            <aug>
               <au>
                  <snm>Krause</snm>
                  <fnm>WJ</fnm>
               </au>
               <au>
                  <snm>Krause</snm>
                  <fnm>WA</fnm>
               </au>
            </aug>
            <source>The Opossum: Its Amazing Story</source>
            <publisher>University of Missouri, Columbia, Department of Pathology and Anatomical Sciences</publisher>
            <pubdate>2006</pubdate>
            <url>http://web.missouri.edu/~krausew/Histology/Home_files/opossum.pdf</url>
         </bibl>
         <bibl id="B6">
            <title>
               <p>Use of maternal reserves as a lactation strategy in large mammals.</p>
            </title>
            <aug>
               <au>
                  <snm>Oftedal</snm>
                  <fnm>O</fnm>
               </au>
            </aug>
            <source>Proc Nutr Soc</source>
            <pubdate>2000</pubdate>
            <volume>59</volume>
            <fpage>99</fpage>
            <lpage>106</lpage>
            <xrefbib>
               <pubid idtype="pmpid">10828179</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B7">
            <title>
               <p>Independent introduction of two lactase-persistence alleles into human populations reflects different history of adaptation to milk culture.</p>
            </title>
            <aug>
               <au>
                  <snm>Enattah</snm>
                  <fnm>NS</fnm>
               </au>
               <au>
                  <snm>Jensen</snm>
                  <fnm>TG</fnm>
               </au>
               <au>
                  <snm>Nielsen</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Lewinski</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Kuokkanen</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Rasinpera</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>El-Shanti</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Seo</snm>
                  <fnm>JK</fnm>
               </au>
               <au>
                  <snm>Alifrangis</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Khalil</snm>
                  <fnm>IF</fnm>
               </au>
               <au>
                  <snm>Natah</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Ali</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Natah</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Comas</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Mehdi</snm>
                  <fnm>SQ</fnm>
               </au>
               <au>
                  <snm>Groop</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Vestergaard</snm>
                  <fnm>EM</fnm>
               </au>
               <au>
                  <snm>Imtiaz</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Rashed</snm>
                  <fnm>MS</fnm>
               </au>
               <au>
                  <snm>Meyer</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Troelsen</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Peltonen</snm>
                  <fnm>L</fnm>
               </au>
            </aug>
            <source>Am J Hum Genet</source>
            <pubdate>2008</pubdate>
            <volume>82</volume>
            <fpage>57</fpage>
            <lpage>72</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2253962</pubid>
                  <pubid idtype="pmpid">18179885</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B8">
            <title>
               <p>Structure and function of milk protein genes.</p>
            </title>
            <aug>
               <au>
                  <snm>Mercier</snm>
                  <fnm>JC</fnm>
               </au>
               <au>
                  <snm>Vilotte</snm>
                  <fnm>JL</fnm>
               </au>
            </aug>
            <source>J Dairy Sci</source>
            <pubdate>1993</pubdate>
            <volume>76</volume>
            <fpage>3079</fpage>
            <lpage>3098</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">8227632</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B9">
            <title>
               <p>Multispecies comparison of the casein gene loci and evolution of casein gene family.</p>
            </title>
            <aug>
               <au>
                  <snm>Rijnkels</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>J Mammary Gland Biol Neoplasia</source>
            <pubdate>2002</pubdate>
            <volume>7</volume>
            <fpage>327</fpage>
            <lpage>345</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">12751895</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B10">
            <title>
               <p>Multispecies comparative analysis of a mammalian-specific genomic domain encoding secretory proteins.</p>
            </title>
            <aug>
               <au>
                  <snm>Rijnkels</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Elnitski</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Miller</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Rosen</snm>
                  <fnm>JM</fnm>
               </au>
            </aug>
            <source>Genomics</source>
            <pubdate>2003</pubdate>
            <volume>82</volume>
            <fpage>417</fpage>
            <lpage>432</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">13679022</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B11">
            <title>
               <p>Characterisation of host defence proteins in milk using a proteomic approach.</p>
            </title>
            <aug>
               <au>
                  <snm>Smolenski</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Haines</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Kwan</snm>
                  <fnm>FY</fnm>
               </au>
               <au>
                  <snm>Bond</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Farr</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Davis</snm>
                  <fnm>SR</fnm>
               </au>
               <au>
                  <snm>Stelwagen</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Wheeler</snm>
                  <fnm>TT</fnm>
               </au>
            </aug>
            <source>J Proteome Res</source>
            <pubdate>2007</pubdate>
            <volume>6</volume>
            <fpage>207</fpage>
            <lpage>215</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">17203965</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B12">
            <title>
               <p>Bovine milk fat globule membrane proteome.</p>
            </title>
            <aug>
               <au>
                  <snm>Reinhardt</snm>
                  <fnm>TA</fnm>
               </au>
               <au>
                  <snm>Lippolis</snm>
                  <fnm>JD</fnm>
               </au>
            </aug>
            <source>J Dairy Res</source>
            <pubdate>2006</pubdate>
            <volume>73</volume>
            <fpage>406</fpage>
            <lpage>416</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">16834814</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B13">
            <title>
               <p>Soluble CD14 in human breast milk and its role in innate immune responses.</p>
            </title>
            <aug>
               <au>
                  <snm>Vidal</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Lab&#233;ta</snm>
                  <fnm>MO</fnm>
               </au>
               <au>
                  <snm>Schiffrin</snm>
                  <fnm>EJ</fnm>
               </au>
               <au>
                  <snm>Donnet-Hughes</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>Acta Odontol Scand</source>
            <pubdate>2001</pubdate>
            <volume>59</volume>
            <fpage>330</fpage>
            <lpage>334</lpage>
            <xrefbib>
               <pubid idtype="pmpid">11680654</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B14">
            <title>
               <p>Soluble forms of Toll-like receptor (TLR)2 capable of modulating TLR2 signaling are present in human plasma and breast milk.</p>
            </title>
            <aug>
               <au>
                  <snm>LeBouder</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Rey-Nores</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Rushmere</snm>
                  <fnm>NK</fnm>
               </au>
               <au>
                  <snm>Grigorov</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Lawn</snm>
                  <fnm>SD</fnm>
               </au>
               <au>
                  <snm>Affolter</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Griffin</snm>
                  <fnm>GE</fnm>
               </au>
               <au>
                  <snm>Ferrara</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Schiffrin</snm>
                  <fnm>EJ</fnm>
               </au>
               <au>
                  <snm>Morgan</snm>
                  <fnm>BP</fnm>
               </au>
               <au>
                  <snm>Lab&#233;ta</snm>
                  <fnm>MO</fnm>
               </au>
            </aug>
            <source>J Immunol</source>
            <pubdate>2003</pubdate>
            <volume>171</volume>
            <fpage>6680</fpage>
            <lpage>6689</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">14662871</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B15">
            <title>
               <p><it>In vitro</it> digestion of novel milk protein ingredients for use in infant formulas: research on biological functions.</p>
            </title>
            <aug>
               <au>
                  <snm>Chatterton</snm>
                  <fnm>DEW</fnm>
               </au>
               <au>
                  <snm>Rasmussen</snm>
                  <fnm>JT</fnm>
               </au>
               <au>
                  <snm>Heegaard</snm>
                  <fnm>CW</fnm>
               </au>
               <au>
                  <snm>Sorensen</snm>
                  <fnm>ES</fnm>
               </au>
               <au>
                  <snm>Petersen</snm>
                  <fnm>TE</fnm>
               </au>
            </aug>
            <source>Trends Food Sci Technol</source>
            <pubdate>2004</pubdate>
            <volume>15</volume>
            <fpage>373</fpage>
            <lpage>383</lpage>
         </bibl>
         <bibl id="B16">
            <title>
               <p>Food-derived peptides and intestinal functions.</p>
            </title>
            <aug>
               <au>
                  <snm>Shimizu</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Son</snm>
                  <fnm>DO</fnm>
               </au>
            </aug>
            <source>Curr Pharm Des</source>
            <pubdate>2007</pubdate>
            <volume>13</volume>
            <fpage>885</fpage>
            <lpage>895</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">17430188</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B17">
            <title>
               <p>The milk lipid globule membrane.</p>
            </title>
            <aug>
               <au>
                  <snm>Keenan</snm>
                  <fnm>TW</fnm>
               </au>
               <au>
                  <snm>Patton</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>Handbook of Milk Composition</source>
            <publisher>Academic Press, Inc</publisher>
            <editor>Jensen RG</editor>
            <pubdate>1995</pubdate>
            <fpage>5</fpage>
            <lpage>50</lpage>
         </bibl>
         <bibl id="B18">
            <title>
               <p>Gene regulatory networks in lactation: identification of global principles using bioinformatics.</p>
            </title>
            <aug>
               <au>
                  <snm>Lemay</snm>
                  <fnm>DG</fnm>
               </au>
               <au>
                  <snm>Neville</snm>
                  <fnm>MC</fnm>
               </au>
               <au>
                  <snm>Rudolph</snm>
                  <fnm>MC</fnm>
               </au>
               <au>
                  <snm>Pollard</snm>
                  <fnm>KS</fnm>
               </au>
               <au>
                  <snm>German</snm>
                  <fnm>JB</fnm>
               </au>
            </aug>
            <source>BMC Syst Biol</source>
            <pubdate>2007</pubdate>
            <volume>1</volume>
            <fpage>56</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2225983</pubid>
                  <pubid idtype="pmpid" link="fulltext">18039394</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B19">
            <title>
               <p>A meta-analysis of quantitative trait loci associated with body weight and adiposity in mice.</p>
            </title>
            <aug>
               <au>
                  <snm>Wuschke</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Dahm</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Schmidt</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Joost</snm>
                  <fnm>HG</fnm>
               </au>
               <au>
                  <snm>Al-Hasani</snm>
                  <fnm>H</fnm>
               </au>
            </aug>
            <source>Int J Obes (Lond)</source>
            <pubdate>2007</pubdate>
            <volume>31</volume>
            <fpage>829</fpage>
            <lpage>841</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">17060928</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B20">
            <title>
               <p>Genomic organization of transcriptomes in mammals: coregulation and cofunctionality.</p>
            </title>
            <aug>
               <au>
                  <snm>Purmann</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Toedling</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Schueler</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Carninci</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Lehrach</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Hayashizaki</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Huber</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Sperling</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>Genomics</source>
            <pubdate>2007</pubdate>
            <volume>89</volume>
            <fpage>580</fpage>
            <lpage>587</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">17369017</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B21">
            <title>
               <p>Evolutionary dynamics of the immunoglobulin heavy chain variable region genes in vertebrates.</p>
            </title>
            <aug>
               <au>
                  <snm>Das</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Nozawa</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Klein</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Nei</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Immunogenetics</source>
            <pubdate>2008</pubdate>
            <volume>60</volume>
            <fpage>47</fpage>
            <lpage>55</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2386433</pubid>
                  <pubid idtype="pmpid" link="fulltext">18196235</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B22">
            <title>
               <p>Evolution and organization of the fibrinogen locus on chromosome 4: gene duplication accompanied by transposition and inversion.</p>
            </title>
            <aug>
               <au>
                  <snm>Kant</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Fornace</snm>
                  <fnm>AJ</fnm>
                  <suf>Jr</suf>
               </au>
               <au>
                  <snm>Saxe</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Simon</snm>
                  <fnm>MI</fnm>
               </au>
               <au>
                  <snm>McBride</snm>
                  <fnm>OW</fnm>
               </au>
               <au>
                  <snm>Crabtree</snm>
                  <fnm>GR</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>1985</pubdate>
            <volume>82</volume>
            <fpage>2344</fpage>
            <lpage>2348</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">397554</pubid>
                  <pubid idtype="pmpid">2986113</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B23">
            <title>
               <p>Chromatin remodelling is a major source of coexpression of linked genes in yeast.</p>
            </title>
            <aug>
               <au>
                  <snm>Batada</snm>
                  <fnm>NN</fnm>
               </au>
               <au>
                  <snm>Urrutia</snm>
                  <fnm>AO</fnm>
               </au>
               <au>
                  <snm>Hurst</snm>
                  <fnm>LD</fnm>
               </au>
            </aug>
            <source>Trends Genet</source>
            <pubdate>2007</pubdate>
            <volume>23</volume>
            <fpage>480</fpage>
            <lpage>484</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">17822800</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B24">
            <title>
               <p>An abundant class of tiny RNAs with probable regulatory roles in <it>Caenorhabditis elegans</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Lau</snm>
                  <fnm>NC</fnm>
               </au>
               <au>
                  <snm>Lim</snm>
                  <fnm>LP</fnm>
               </au>
               <au>
                  <snm>Weinstein</snm>
                  <fnm>EG</fnm>
               </au>
               <au>
                  <snm>Bartel</snm>
                  <fnm>DP</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2001</pubdate>
            <volume>294</volume>
            <fpage>858</fpage>
            <lpage>862</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">11679671</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B25">
            <title>
               <p>Characterisation of a second, apparently inactive, copy of the bovine beta-lactoglobulin gene.</p>
            </title>
            <aug>
               <au>
                  <snm>Passey</snm>
                  <fnm>RJ</fnm>
               </au>
               <au>
                  <snm>Mackinlay</snm>
                  <fnm>AG</fnm>
               </au>
            </aug>
            <source>Eur J Biochem</source>
            <pubdate>1995</pubdate>
            <volume>233</volume>
            <fpage>736</fpage>
            <lpage>743</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">8521836</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B26">
            <title>
               <p>Horse alpha-1-antitrypsin, beta-lactoglobulins 1 and 2, and transferrin map to positions 24q15-q16, 28q18-qter, 28q18-qter and 16q23, respectively.</p>
            </title>
            <aug>
               <au>
                  <snm>Lear</snm>
                  <fnm>TL</fnm>
               </au>
               <au>
                  <snm>Brandon</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Masel</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Bell</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Bailey</snm>
                  <fnm>E</fnm>
               </au>
            </aug>
            <source>Chromosome Res</source>
            <pubdate>1999</pubdate>
            <volume>7</volume>
            <fpage>667</fpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">10628669</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B27">
            <title>
               <p>Isolation, sequencing and relative quantitation by fluorescent-ratio PCR of feline beta-lactoglobulin I, II, and III cDNAs.</p>
            </title>
            <aug>
               <au>
                  <snm>Pena</snm>
                  <fnm>RN</fnm>
               </au>
               <au>
                  <snm>Sanchez</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Coll</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Folch</snm>
                  <fnm>JM</fnm>
               </au>
            </aug>
            <source>Mamm Genome</source>
            <pubdate>1999</pubdate>
            <volume>10</volume>
            <fpage>560</fpage>
            <lpage>564</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">10341085</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B28">
            <title>
               <p>Feline beta-lactoglobulins I, II and III, and canine beta-lactoglobulins I and II; amino acidic sequences provide evidence for the existence of more than one gene for beta-lactoglobulin in the cat and dog.</p>
            </title>
            <aug>
               <au>
                  <snm>Halliday</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Bell</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>McAndrew</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Shaw</snm>
                  <fnm>DC</fnm>
               </au>
            </aug>
            <source>Protein Seq Data Anal</source>
            <pubdate>1993</pubdate>
            <volume>5</volume>
            <fpage>201</fpage>
            <lpage>205</lpage>
         </bibl>
         <bibl id="B29">
            <title>
               <p>Invited review: beta-lactoglobulin: binding properties, structure, and function.</p>
            </title>
            <aug>
               <au>
                  <snm>Kontopidis</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Holt</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Sawyer</snm>
                  <fnm>L</fnm>
               </au>
            </aug>
            <source>J Dairy Sci</source>
            <pubdate>2004</pubdate>
            <volume>87</volume>
            <fpage>785</fpage>
            <lpage>796</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">15259212</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B30">
            <title>
               <p>beta-Lactoglobulin.</p>
            </title>
            <aug>
               <au>
                  <snm>Hambling</snm>
                  <fnm>SG</fnm>
               </au>
               <au>
                  <snm>McAlpine</snm>
                  <fnm>AS</fnm>
               </au>
               <au>
                  <snm>Sawyer</snm>
                  <fnm>L</fnm>
               </au>
            </aug>
            <source>Advances in Dairy Chemistry</source>
            <publisher>Proteins. Barking, Essex, UK: Elsevier</publisher>
            <editor>Fox PF</editor>
            <pubdate>1992</pubdate>
            <volume>I</volume>
            <fpage>141</fpage>
            <lpage>190</lpage>
         </bibl>
         <bibl id="B31">
            <title>
               <p>Identification of alpha-lactalbumin and beta-lactoglobulin in cynomolgus monkey (<it>Macaca fascicularis</it>) milk.</p>
            </title>
            <aug>
               <au>
                  <snm>Azuma</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Yamauchi</snm>
                  <fnm>K</fnm>
               </au>
            </aug>
            <source>Comp Biochem Physiol B</source>
            <pubdate>1991</pubdate>
            <volume>99</volume>
            <fpage>917</fpage>
            <lpage>921</lpage>
            <xrefbib>
               <pubid idtype="pmpid">1790682</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B32">
            <title>
               <p>Isolation and characterization of a 21 kDa whey protein in rhesus monkey (<it>Macaca mulatta</it>) milk.</p>
            </title>
            <aug>
               <au>
                  <snm>Kunz</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Lonnerdal</snm>
                  <fnm>B</fnm>
               </au>
            </aug>
            <source>Comp Biochem Physiol Biochem Mol Biol</source>
            <pubdate>1994</pubdate>
            <volume>108</volume>
            <fpage>463</fpage>
            <lpage>469</lpage>
            <xrefbib>
               <pubid idtype="pmpid">7953066</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B33">
            <title>
               <p>Characterization of baboon (<it>Papio hamadryas</it>) milk proteins.</p>
            </title>
            <aug>
               <au>
                  <snm>Hall</snm>
                  <fnm>AJ</fnm>
               </au>
               <au>
                  <snm>Masel</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Bell</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Halliday</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Shaw</snm>
                  <fnm>DC</fnm>
               </au>
               <au>
                  <snm>VandeBerg</snm>
                  <fnm>JL</fnm>
               </au>
            </aug>
            <source>Biochem Genet</source>
            <pubdate>2001</pubdate>
            <volume>39</volume>
            <fpage>59</fpage>
            <lpage>71</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">11444021</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B34">
            <title>
               <p>Complete amino acid sequence of human placental protein 14: a progesterone-regulated uterine protein homologous to beta-lactoglobulins.</p>
            </title>
            <aug>
               <au>
                  <snm>Julkunen</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Seppala</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Janne</snm>
                  <fnm>OA</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>1988</pubdate>
            <volume>85</volume>
            <fpage>8845</fpage>
            <lpage>8849</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">282603</pubid>
                  <pubid idtype="pmpid">3194393</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B35">
            <title>
               <p>Human placental protein 14 gene: sequence and characterization of a short duplication.</p>
            </title>
            <aug>
               <au>
                  <snm>Vaisse</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Atger</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Potier</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Milgrom</snm>
                  <fnm>E</fnm>
               </au>
            </aug>
            <source>DNA Cell Biol</source>
            <pubdate>1990</pubdate>
            <volume>9</volume>
            <fpage>401</fpage>
            <lpage>413</lpage>
            <xrefbib>
               <pubid idtype="pmpid">2206398</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B36">
            <title>
               <p>The human placental protein 14 (PP14) gene is localized on chromosome 9q34.</p>
            </title>
            <aug>
               <au>
                  <snm>Van Cong</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Vaisse</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Gross</snm>
                  <fnm>MS</fnm>
               </au>
               <au>
                  <snm>Slim</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Milgrom</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Bernheim</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>Hum Genet</source>
            <pubdate>1991</pubdate>
            <volume>86</volume>
            <fpage>515</fpage>
            <lpage>518</lpage>
            <xrefbib>
               <pubid idtype="pmpid">2016092</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B37">
            <title>
               <p>Expression of glycodelin in human breast and breast cancer.</p>
            </title>
            <aug>
               <au>
                  <snm>Kamarainen</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Halttunen</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Koistinen</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>von Boguslawsky</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>von Smitten</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Andersson</snm>
                  <fnm>LC</fnm>
               </au>
               <au>
                  <snm>Seppala</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Int J Cancer</source>
            <pubdate>1999</pubdate>
            <volume>83</volume>
            <fpage>738</fpage>
            <lpage>742</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">10597188</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B38">
            <title>
               <p>Regulation of the glycosylated beta-lactoglobulin homolog, glycodelin [placental protein 14:(PP14)] in the baboon (<it>Papio anubis</it>) uterus.</p>
            </title>
            <aug>
               <au>
                  <snm>Hausermann</snm>
                  <fnm>HM</fnm>
               </au>
               <au>
                  <snm>Donnelly</snm>
                  <fnm>KM</fnm>
               </au>
               <au>
                  <snm>Bell</snm>
                  <fnm>SC</fnm>
               </au>
               <au>
                  <snm>Verhage</snm>
                  <fnm>HG</fnm>
               </au>
               <au>
                  <snm>Fazleabas</snm>
                  <fnm>AT</fnm>
               </au>
            </aug>
            <source>J Clin Endocrinol Metab</source>
            <pubdate>1998</pubdate>
            <volume>83</volume>
            <fpage>1226</fpage>
            <lpage>1233</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">9543146</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B39">
            <title>
               <p>Dynamics of mammalian chromosome evolution inferred from multispecies comparative maps.</p>
            </title>
            <aug>
               <au>
                  <snm>Murphy</snm>
                  <fnm>WJ</fnm>
               </au>
               <au>
                  <snm>Larkin</snm>
                  <fnm>DM</fnm>
               </au>
               <au>
                  <snm>Everts-van der Wind</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Bourque</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Tesler</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Auvil</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Beever</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Chowdhary</snm>
                  <fnm>BP</fnm>
               </au>
               <au>
                  <snm>Galibert</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Gatzke</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Hitte</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Meyers</snm>
                  <fnm>SN</fnm>
               </au>
               <au>
                  <snm>Milan</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Ostrander</snm>
                  <fnm>EA</fnm>
               </au>
               <au>
                  <snm>Pape</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Parker</snm>
                  <fnm>HG</fnm>
               </au>
               <au>
                  <snm>Raudsepp</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Rogatcheva</snm>
                  <fnm>MB</fnm>
               </au>
               <au>
                  <snm>Schook</snm>
                  <fnm>LB</fnm>
               </au>
               <au>
                  <snm>Skow</snm>
                  <fnm>LC</fnm>
               </au>
               <au>
                  <snm>Welge</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Womack</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>O'Brien</snm>
                  <fnm>SJ</fnm>
               </au>
               <au>
                  <snm>Pevzner</snm>
                  <fnm>PA</fnm>
               </au>
               <au>
                  <snm>Lewin</snm>
                  <fnm>HA</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2005</pubdate>
            <volume>309</volume>
            <fpage>613</fpage>
            <lpage>617</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">16040707</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B40">
            <title>
               <p>The conserved TFLK motif of mammary-associated serum amyloid A3 is responsible for up-regulation of intestinal MUC3 mucin expression <it>in vitro</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Mack</snm>
                  <fnm>DR</fnm>
               </au>
               <au>
                  <snm>McDonald</snm>
                  <fnm>TL</fnm>
               </au>
               <au>
                  <snm>Larson</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Wei</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Weber</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>Pediatr Res</source>
            <pubdate>2003</pubdate>
            <volume>53</volume>
            <fpage>137</fpage>
            <lpage>142</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">12508093</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B41">
            <title>
               <p>Human serum amyloid A3 peptide enhances intestinal MUC3 expression and inhibits EPEC adherence.</p>
            </title>
            <aug>
               <au>
                  <snm>Larson</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Wei</snm>
                  <fnm>SH</fnm>
               </au>
               <au>
                  <snm>Weber</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Mack</snm>
                  <fnm>DR</fnm>
               </au>
               <au>
                  <snm>McDonald</snm>
                  <fnm>TL</fnm>
               </au>
            </aug>
            <source>Biochem Biophys Res Commun</source>
            <pubdate>2003</pubdate>
            <volume>300</volume>
            <fpage>531</fpage>
            <lpage>540</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">12504116</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B42">
            <title>
               <p>Serum amyloid A is an innate immune opsonin for Gram-negative bacteria.</p>
            </title>
            <aug>
               <au>
                  <snm>Shah</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Hari-Dass</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Raynes</snm>
                  <fnm>JG</fnm>
               </au>
            </aug>
            <source>Blood</source>
            <pubdate>2006</pubdate>
            <volume>108</volume>
            <fpage>1751</fpage>
            <lpage>1757</lpage>
            <xrefbib>
               <pubid idtype="pmpid">16735604</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B43">
            <title>
               <p>The genome sequence of taurine cattle: a window to ruminant biology and evolution.</p>
            </title>
            <aug>
               <au>
                  <cnm>The Bovine Genome Sequencing and Analysis Consortium</cnm>
               </au>
               <au>
                  <snm>Elsik</snm>
                  <fnm>CG</fnm>
               </au>
               <au>
                  <snm>Tellam</snm>
                  <fnm>RL</fnm>
               </au>
               <au>
                  <snm>Worley</snm>
                  <fnm>KC</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2009</pubdate>
            <volume>324</volume>
            <fpage>522</fpage>
            <lpage>528</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">19390049</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B44">
            <title>
               <p>Genome analysis of the platypus reveals unique signatures of evolution.</p>
            </title>
            <aug>
               <au>
                  <snm>Warren</snm>
                  <fnm>WC</fnm>
               </au>
               <au>
                  <snm>Hillier</snm>
                  <fnm>LW</fnm>
               </au>
               <au>
                  <snm>Marshall Graves</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Birney</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Ponting</snm>
                  <fnm>CP</fnm>
               </au>
               <au>
                  <snm>Grutzner</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Belov</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Miller</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Clarke</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Chinwalla</snm>
                  <fnm>AT</fnm>
               </au>
               <au>
                  <snm>Yang</snm>
                  <fnm>SP</fnm>
               </au>
               <au>
                  <snm>Heger</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Locke</snm>
                  <fnm>DP</fnm>
               </au>
               <au>
                  <snm>Miethke</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Waters</snm>
                  <fnm>PD</fnm>
               </au>
               <au>
                  <snm>Veyrunes</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Fulton</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Fulton</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Graves</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Wallis</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Puente</snm>
                  <fnm>XS</fnm>
               </au>
               <au>
                  <snm>L&#243;pez-Ot&#237;n</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Ord&#243;&#241;ez</snm>
                  <fnm>GR</fnm>
               </au>
               <au>
                  <snm>Eichler</snm>
                  <fnm>EE</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Cheng</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Deakin</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Alsop</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Thompson</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Kirby</snm>
                  <fnm>P</fnm>
               </au>
               <etal/>
            </aug>
            <source>Nature</source>
            <pubdate>2008</pubdate>
            <volume>453</volume>
            <fpage>175</fpage>
            <lpage>183</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">18464734</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B45">
            <title>
               <p>Characterization of the opossum immune genome provides insights into the evolution of the mammalian immune system.</p>
            </title>
            <aug>
               <au>
                  <snm>Belov</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Sanderson</snm>
                  <fnm>CE</fnm>
               </au>
               <au>
                  <snm>Deakin</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Wong</snm>
                  <fnm>ES</fnm>
               </au>
               <au>
                  <snm>Assange</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>McColl</snm>
                  <fnm>KA</fnm>
               </au>
               <au>
                  <snm>Gout</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>de Bono</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Barrow</snm>
                  <fnm>AD</fnm>
               </au>
               <au>
                  <snm>Speed</snm>
                  <fnm>TP</fnm>
               </au>
               <au>
                  <snm>Trowsdale</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Papenfuss</snm>
                  <fnm>AT</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2007</pubdate>
            <volume>17</volume>
            <fpage>982</fpage>
            <lpage>991</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1899125</pubid>
                  <pubid idtype="pmpid" link="fulltext">17495011</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B46">
            <title>
               <p>Transepithelial transport of immunoglobulins.</p>
            </title>
            <aug>
               <au>
                  <snm>Mostov</snm>
                  <fnm>KE</fnm>
               </au>
            </aug>
            <source>Annu Rev Immunol</source>
            <pubdate>1994</pubdate>
            <volume>12</volume>
            <fpage>63</fpage>
            <lpage>84</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">8011293</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B47">
            <title>
               <p>Ruminants genome no longer contains whey acidic protein gene but only a pseudogene.</p>
            </title>
            <aug>
               <au>
                  <snm>Hajjoubi</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Rival-Gervier</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Hayes</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Floriot</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Eggen</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Piumi</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Chardon</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Houdebine</snm>
                  <fnm>LM</fnm>
               </au>
               <au>
                  <snm>Thepot</snm>
                  <fnm>D</fnm>
               </au>
            </aug>
            <source>Gene</source>
            <pubdate>2006</pubdate>
            <volume>370</volume>
            <fpage>104</fpage>
            <lpage>112</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">16483732</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B48">
            <title>
               <p>Proteomic analysis of two functional states of the Golgi complex in mammary epithelial cells.</p>
            </title>
            <aug>
               <au>
                  <snm>Wu</snm>
                  <fnm>CC</fnm>
               </au>
               <au>
                  <snm>Yates</snm>
                  <fnm>JR</fnm>
                  <suf>3rd</suf>
               </au>
               <au>
                  <snm>Neville</snm>
                  <fnm>MC</fnm>
               </au>
               <au>
                  <snm>Howell</snm>
                  <fnm>KE</fnm>
               </au>
            </aug>
            <source>Traffic</source>
            <pubdate>2000</pubdate>
            <volume>1</volume>
            <fpage>769</fpage>
            <lpage>782</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">11208067</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B49">
            <title>
               <p>Conversion of alpha-lactalbumin to a protein inducing apoptosis.</p>
            </title>
            <aug>
               <au>
                  <snm>Svensson</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Hakansson</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Mossberg</snm>
                  <fnm>AK</fnm>
               </au>
               <au>
                  <snm>Linse</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Svanborg</snm>
                  <fnm>C</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2000</pubdate>
            <volume>97</volume>
            <fpage>4221</fpage>
            <lpage>4226</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">18203</pubid>
                  <pubid idtype="pmpid" link="fulltext">10760289</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B50">
            <title>
               <p>Lack of functional alpha-lactalbumin prevents involution in Cape fur seals and identifies the protein as an apoptotic milk factor in mammary gland involution.</p>
            </title>
            <aug>
               <au>
                  <snm>Sharp</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Lefevre</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Nicholas</snm>
                  <fnm>KR</fnm>
               </au>
            </aug>
            <source>BMC Biol</source>
            <pubdate>2008</pubdate>
            <volume>6</volume>
            <fpage>48</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2600633</pubid>
                  <pubid idtype="pmpid" link="fulltext">18986549</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B51">
            <title>
               <p>A genomics approach to the detection of positive selection in cattle: adaptive evolution of the T-cell and natural killer cell-surface protein CD2.</p>
            </title>
            <aug>
               <au>
                  <snm>Lynn</snm>
                  <fnm>DJ</fnm>
               </au>
               <au>
                  <snm>Freeman</snm>
                  <fnm>AR</fnm>
               </au>
               <au>
                  <snm>Murray</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Bradley</snm>
                  <fnm>DG</fnm>
               </au>
            </aug>
            <source>Genetics</source>
            <pubdate>2005</pubdate>
            <volume>170</volume>
            <fpage>1189</fpage>
            <lpage>1196</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1451189</pubid>
                  <pubid idtype="pmpid" link="fulltext">15802510</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B52">
            <title>
               <p>Nucleotide sequence evolution at the kappa-casein locus: evidence for positive selection within the family Bovidae.</p>
            </title>
            <aug>
               <au>
                  <snm>Ward</snm>
                  <fnm>TJ</fnm>
               </au>
               <au>
                  <snm>Honeycutt</snm>
                  <fnm>RL</fnm>
               </au>
               <au>
                  <snm>Derr</snm>
                  <fnm>JN</fnm>
               </au>
            </aug>
            <source>Genetics</source>
            <pubdate>1997</pubdate>
            <volume>147</volume>
            <fpage>1863</fpage>
            <lpage>1872</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1208352</pubid>
                  <pubid idtype="pmpid" link="fulltext">9409842</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B53">
            <title>
               <p>Evolution and infant feeding.</p>
            </title>
            <aug>
               <au>
                  <snm>Dugdale</snm>
                  <fnm>AE</fnm>
               </au>
            </aug>
            <source>Lancet</source>
            <pubdate>1986</pubdate>
            <volume>1</volume>
            <fpage>670</fpage>
            <lpage>673</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">2869357</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B54">
            <title>
               <p>The human genome browser at UCSC.</p>
            </title>
            <aug>
               <au>
                  <snm>Kent</snm>
                  <fnm>WJ</fnm>
               </au>
               <au>
                  <snm>Sugnet</snm>
                  <fnm>CW</fnm>
               </au>
               <au>
                  <snm>Furey</snm>
                  <fnm>TS</fnm>
               </au>
               <au>
                  <snm>Roskin</snm>
                  <fnm>KM</fnm>
               </au>
               <au>
                  <snm>Pringle</snm>
                  <fnm>TH</fnm>
               </au>
               <au>
                  <snm>Zahler</snm>
                  <fnm>AM</fnm>
               </au>
               <au>
                  <snm>Haussler</snm>
                  <fnm>D</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2002</pubdate>
            <volume>12</volume>
            <fpage>996</fpage>
            <lpage>1006</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">186604</pubid>
                  <pubid idtype="pmpid" link="fulltext">12045153</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B55">
            <title>
               <p>BLAT - the BLAST-like alignment tool.</p>
            </title>
            <aug>
               <au>
                  <snm>Kent</snm>
                  <fnm>WJ</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2002</pubdate>
            <volume>12</volume>
            <fpage>656</fpage>
            <lpage>664</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">187518</pubid>
                  <pubid idtype="pmpid" link="fulltext">11932250</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B56">
            <title>
               <p>dbEST - database for "expressed sequence tags".</p>
            </title>
            <aug>
               <au>
                  <snm>Boguski</snm>
                  <fnm>MS</fnm>
               </au>
               <au>
                  <snm>Lowe</snm>
                  <fnm>TM</fnm>
               </au>
               <au>
                  <snm>Tolstoshev</snm>
                  <fnm>CM</fnm>
               </au>
            </aug>
            <source>Nat Genet</source>
            <pubdate>1993</pubdate>
            <volume>4</volume>
            <fpage>332</fpage>
            <lpage>333</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">8401577</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B57">
            <title>
               <p>The UCSC Table Browser data retrieval tool.</p>
            </title>
            <aug>
               <au>
                  <snm>Karolchik</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Hinrichs</snm>
                  <fnm>AS</fnm>
               </au>
               <au>
                  <snm>Furey</snm>
                  <fnm>TS</fnm>
               </au>
               <au>
                  <snm>Roskin</snm>
                  <fnm>KM</fnm>
               </au>
               <au>
                  <snm>Sugnet</snm>
                  <fnm>CW</fnm>
               </au>
               <au>
                  <snm>Haussler</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Kent</snm>
                  <fnm>WJ</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2004</pubdate>
            <issue>32 Database</issue>
            <fpage>D493</fpage>
            <lpage>D496</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">308837</pubid>
                  <pubid idtype="pmpid" link="fulltext">14681465</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B58">
            <title>
               <p>Improving the specificity of high-throughput ortholog prediction.</p>
            </title>
            <aug>
               <au>
                  <snm>Fulton</snm>
                  <fnm>DL</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>YY</fnm>
               </au>
               <au>
                  <snm>Laird</snm>
                  <fnm>MR</fnm>
               </au>
               <au>
                  <snm>Horsman</snm>
                  <fnm>BG</fnm>
               </au>
               <au>
                  <snm>Roche</snm>
                  <fnm>FM</fnm>
               </au>
               <au>
                  <snm>Brinkman</snm>
                  <fnm>FS</fnm>
               </au>
            </aug>
            <source>BMC Bioinformatics</source>
            <pubdate>2006</pubdate>
            <volume>7</volume>
            <fpage>270</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1524997</pubid>
                  <pubid idtype="pmpid" link="fulltext">16729895</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B59">
            <title>
               <p>GO-Elite</p>
            </title>
            <url>http://www.genmapp.org/go_elite/go_elite.html</url>
         </bibl>
         <bibl id="B60">
            <title>
               <p>Ingenuity Pathways Analysis</p>
            </title>
            <url>http://www.ingenuity.com/products/pathways_analysis.html</url>
         </bibl>
         <bibl id="B61">
            <title>
               <p>Multtest R library</p>
            </title>
            <url>http://bioconductor.org/</url>
         </bibl>
         <bibl id="B62">
            <title>
               <p>Multiple testing procedures: R multtest package and applications to genomics.</p>
            </title>
            <aug>
               <au>
                  <snm>Pollard</snm>
                  <fnm>KS</fnm>
               </au>
               <au>
                  <snm>Dudoit</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Laan</snm>
                  <mnm>van der</mnm>
                  <fnm>MJ</fnm>
               </au>
            </aug>
            <source>Bioinformatics and Computational Biology Solutions Using R and Bioconductor</source>
            <publisher>Springer</publisher>
            <editor>Gentleman R, Carey V, Huber W, Irizarry R, Dudoit S</editor>
            <pubdate>2005</pubdate>
            <fpage>251</fpage>
            <lpage>272</lpage>
         </bibl>
         <bibl id="B63">
            <title>
               <p>Identifying genetic networks underlying myometrial transition to labor.</p>
            </title>
            <aug>
               <au>
                  <snm>Salomonis</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Cotte</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Zambon</snm>
                  <fnm>AC</fnm>
               </au>
               <au>
                  <snm>Pollard</snm>
                  <fnm>KS</fnm>
               </au>
               <au>
                  <snm>Vranizan</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Doniger</snm>
                  <fnm>SW</fnm>
               </au>
               <au>
                  <snm>Dolganov</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Conklin</snm>
                  <fnm>BR</fnm>
               </au>
            </aug>
            <source>Genome Biol</source>
            <pubdate>2005</pubdate>
            <volume>6</volume>
            <fpage>R12</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">551532</pubid>
                  <pubid idtype="pmpid" link="fulltext">15693941</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B64">
            <title>
               <p>OrthoDB: the hierarchical catalog of eukaryotic orthologs.</p>
            </title>
            <aug>
               <au>
                  <snm>Kriventseva</snm>
                  <fnm>EV</fnm>
               </au>
               <au>
                  <snm>Rahman</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Espinosa</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Zdobnov</snm>
                  <fnm>EM</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2008</pubdate>
            <issue>36 Database</issue>
            <fpage>D271</fpage>
            <lpage>D275</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2238902</pubid>
                  <pubid idtype="pmpid" link="fulltext">17947323</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B65">
            <title>
               <p>Ensembl 2007.</p>
            </title>
            <aug>
               <au>
                  <snm>Hubbard</snm>
                  <fnm>TJ</fnm>
               </au>
               <au>
                  <snm>Aken</snm>
                  <fnm>BL</fnm>
               </au>
               <au>
                  <snm>Beal</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Ballester</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Caccamo</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Clarke</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Coates</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Cunningham</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Cutts</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Down</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Dyer</snm>
                  <fnm>SC</fnm>
               </au>
               <au>
                  <snm>Fitzgerald</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Fernandez-Banet</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Graf</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Haider</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Hammond</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Herrero</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Holland</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Howe</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Howe</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Johnson</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Kahari</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Keefe</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Kokocinski</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Kulesha</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Lawson</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Longden</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Melsopp</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Megy</snm>
                  <fnm>K</fnm>
               </au>
               <etal/>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2007</pubdate>
            <issue>35 Database</issue>
            <fpage>D610</fpage>
            <lpage>D617</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1761443</pubid>
                  <pubid idtype="pmpid" link="fulltext">17148474</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B66">
            <title>
               <p>The Bovine Genome Database</p>
            </title>
            <url>http://BovineGenome.org</url>
         </bibl>
         <bibl id="B67">
            <title>
               <p>The Universal Protein Resource (UniProt).</p>
            </title>
            <source>Nucleic Acids Res</source>
            <pubdate>2008</pubdate>
            <issue>36 Database</issue>
            <fpage>D190</fpage>
            <lpage>D195</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2238893</pubid>
                  <pubid idtype="pmpid" link="fulltext">18045787</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B68">
            <title>
               <p>Cluster analysis and display of genome-wide expression patterns.</p>
            </title>
            <aug>
               <au>
                  <snm>Eisen</snm>
                  <fnm>MB</fnm>
               </au>
               <au>
                  <snm>Spellman</snm>
                  <fnm>PT</fnm>
               </au>
               <au>
                  <snm>Brown</snm>
                  <fnm>PO</fnm>
               </au>
               <au>
                  <snm>Botstein</snm>
                  <fnm>D</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>1998</pubdate>
            <volume>95</volume>
            <fpage>14863</fpage>
            <lpage>14868</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">24541</pubid>
                  <pubid idtype="pmpid" link="fulltext">9843981</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B69">
            <title>
               <p>PermutMatrix: a graphical environment to arrange gene expression profiles in optimal linear order.</p>
            </title>
            <aug>
               <au>
                  <snm>Caraux</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Pinloche</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>2005</pubdate>
            <volume>21</volume>
            <fpage>1280</fpage>
            <lpage>1281</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">15546938</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B70">
            <title>
               <p>Ensembl 2008.</p>
            </title>
            <aug>
               <au>
                  <snm>Flicek</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Aken</snm>
                  <fnm>BL</fnm>
               </au>
               <au>
                  <snm>Beal</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Ballester</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Caccamo</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Clarke</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Coates</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Cunningham</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Cutts</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Down</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Dyer</snm>
                  <fnm>SC</fnm>
               </au>
               <au>
                  <snm>Eyre</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Fitzgerald</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Fernandez-Banet</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Gr&#228;f</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Haider</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Hammond</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Holland</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Howe</snm>
                  <fnm>KL</fnm>
               </au>
               <au>
                  <snm>Howe</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Johnson</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Jenkinson</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>K&#228;h&#228;ri</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Keefe</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Kokocinski</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Kulesha</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Lawson</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Longden</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Megy</snm>
                  <fnm>K</fnm>
               </au>
               <etal/>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2008</pubdate>
            <issue>36 Database</issue>
            <fpage>D707</fpage>
            <lpage>D714</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2238821</pubid>
                  <pubid idtype="pmpid" link="fulltext">18000006</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B71">
            <title>
               <p>MUSCLE: multiple sequence alignment with high accuracy and high throughput.</p>
            </title>
            <aug>
               <au>
                  <snm>Edgar</snm>
                  <fnm>RC</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2004</pubdate>
            <volume>32</volume>
            <fpage>1792</fpage>
            <lpage>1797</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">390337</pubid>
                  <pubid idtype="pmpid" link="fulltext">15034147</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B72">
            <title>
               <p>A simple, fast, and accurate algorithm to estimate large phylogenies by maximum likelihood.</p>
            </title>
            <aug>
               <au>
                  <snm>Guindon</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Gascuel</snm>
                  <fnm>O</fnm>
               </au>
            </aug>
            <source>Syst Biol</source>
            <pubdate>2003</pubdate>
            <volume>52</volume>
            <fpage>696</fpage>
            <lpage>704</lpage>
            <xrefbib>
               <pubid idtype="pmpid">14530136</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B73">
            <title>
               <p>PHYML Online - a web server for fast maximum likelihood-based phylogenetic inference.</p>
            </title>
            <aug>
               <au>
                  <snm>Guindon</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Lethiec</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Duroux</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Gascuel</snm>
                  <fnm>O</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2005</pubdate>
            <issue>33 Web Server</issue>
            <fpage>W557</fpage>
            <lpage>W559</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1160113</pubid>
                  <pubid idtype="pmpid" link="fulltext">15980534</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B74">
            <title>
               <p>The rapid generation of mutation data matrices from protein sequences.</p>
            </title>
            <aug>
               <au>
                  <snm>Jones</snm>
                  <fnm>DT</fnm>
               </au>
               <au>
                  <snm>Taylor</snm>
                  <fnm>WR</fnm>
               </au>
               <au>
                  <snm>Thornton</snm>
                  <fnm>JM</fnm>
               </au>
            </aug>
            <source>Comput Appl Biosci</source>
            <pubdate>1992</pubdate>
            <volume>8</volume>
            <fpage>275</fpage>
            <lpage>282</lpage>
            <xrefbib>
               <pubid idtype="pmpid">1633570</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B75">
            <title>
               <p>PAML 4: phylogenetic analysis by maximum likelihood.</p>
            </title>
            <aug>
               <au>
                  <snm>Yang</snm>
                  <fnm>Z</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2007</pubdate>
            <volume>24</volume>
            <fpage>1586</fpage>
            <lpage>1591</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">17483113</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B76">
            <title>
               <p>Miscellaneous factors affecting composition and volume of human and bovine milks.</p>
            </title>
            <aug>
               <au>
                  <snm>Jensen</snm>
                  <fnm>RG</fnm>
               </au>
            </aug>
            <source>Handbook of Milk Composition</source>
            <publisher>Academic Press, Inc</publisher>
            <editor>Jensen RG</editor>
            <pubdate>1995</pubdate>
            <fpage>237</fpage>
            <lpage>267</lpage>
         </bibl>
         <bibl id="B77">
            <title>
               <p>Phylogenetic variation in the gross composition of milks.</p>
            </title>
            <aug>
               <au>
                  <snm>Oftedal</snm>
                  <fnm>OT</fnm>
               </au>
               <au>
                  <snm>Iverson</snm>
                  <fnm>SJ</fnm>
               </au>
            </aug>
            <source>Handbook of Milk Composition</source>
            <publisher>Academic Press, Inc</publisher>
            <editor>Jensen RG</editor>
            <pubdate>1995</pubdate>
            <fpage>749</fpage>
            <lpage>780</lpage>
         </bibl>
         <bibl id="B78">
            <title>
               <p>Milk composition in an American marsupial (<it>Monodelphis domestica</it>).</p>
            </title>
            <aug>
               <au>
                  <snm>Green</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>VandeBerg</snm>
                  <fnm>JL</fnm>
               </au>
               <au>
                  <snm>Newgrain</snm>
                  <fnm>K</fnm>
               </au>
            </aug>
            <source>Comp Biochem Physiol B</source>
            <pubdate>1991</pubdate>
            <volume>99</volume>
            <fpage>663</fpage>
            <lpage>665</lpage>
            <xrefbib>
               <pubid idtype="pmpid">1769214</pubid>
            </xrefbib>
         </bibl>
      </refgrp>
   </bm>
</art>
