<?xml version="1.0" encoding="UTF-8"?>

<rdf:RDF
   xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
   xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#"
   xmlns="http://purl.org/rss/1.0/"
   xmlns:dc="http://purl.org/dc/elements/1.1/"
   xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/"
   xmlns:dcterms="http://purl.org/dc/terms/"

>
<channel rdf:about="http://www.citeulike.org/about">
<pubDate>Sat, 26 Jul 2008 07:34:30 BST</pubDate>


	<title>CiteULike: macavity1g's library [61 articles]</title>
	<description>CiteULike: macavity1g's library [61 articles]</description>


	<link>http://www.citeulike.org/user/macavity1g</link>
	<dc:publisher>CiteULike.org</dc:publisher>
	<dc:language>en-gb</dc:language>
	<dc:rights>Copyright &#169; 2004-2008 citeulike.org</dc:rights>
	<items>
    <rdf:Seq>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/812748"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/2140896"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/1324276"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/835519"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/1238"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/1122908"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/1268851"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/697707"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/349668"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/63158"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/1068457"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/1038497"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/1164885"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/1164880"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/1105945"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/695901"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/973077"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/927557"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/530843"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/63193"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/118774"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/1031417"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/597632"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/994277"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/1088407"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/504895"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/1038480"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/1133608"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/352759"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/473090"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/447448"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/1090877"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/927698"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/1133679"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/1133459"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/1052952"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/591480"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/1152294"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/825696"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/504893"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/1030057"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/504894"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/547897"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/1052789"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/1152288"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/1023353"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/911311"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/1075871"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/220934"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/macavity1g/article/604164"/>

	</rdf:Seq>
	</items>
	</channel>


<item rdf:about="http://www.citeulike.org/user/macavity1g/article/812748">
    <title>Group testing for pathway analysis improves comparability of different microarray data sets.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/812748</link>
    <description>&lt;i&gt;Bioinformatics (7 August 2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;MOTIVATION: The wide use of DNA microarrays for the investigation of the cell transcriptome triggered the invention of numerous methods for the processing of microarray data and lead to a growing number of microarray studies that examine the same biological conditions. However, comparisons made on the level of gene lists obtained by different statistical methods or from different data sets hardly converge. We aimed at examining such discrepancies on the level of apparently affected biologically related groups of genes, for example metabolic or signalling pathways. This can be achieved by group testing procedures, e.g. over-representation analysis (ORA), bluefunctional class scoring (FCS), or global tests. RESULTS: Three public prostate cancer data sets obtained with the same microarray platform (HGU95A/HGU95av2) were analyzed. Each data set was subjected to normalization by either variance stabilizing normalization (vsn) or mixed model normalization (MMN). Then, statistical analysis of microarrays (SAM) was applied to the vsn-normalized data and mixed model analsis (MMA) to the data normalized by MMN. For multiple testing adjustment the false discovery rate (FDR) was calculated and the threshold was set to 0.05. Gene lists from the same method applied to different data sets showed overlaps between 42% and 52%, while lists from different methods applied to the same data set had between 63% and 85% of genes in common. A number of six gene lists obtained by the two statistical methods applied to the three data sets was then subjected to group testing by blueFisher's exact test. Group testing by GSEA and global test was applied to the three data sets, as well. Fisher's exact test followed by global test showed more consistent results with respect to the concordance between analyses on gene lists obtained by different methods and different data sets than the GSEA. However, all group testing methods identified pathways that had already been described to be involved in the pathogenesis of prostate cancer. Moreover, pathways recurrently identified in these analyses are more likely to be reliable than those from a single analysis on a single data set. Supplementary Info: Supplementary Figure 1 and Supplementary Tables 1-4 are available from the Journal's website.</description>
    <dc:title>Group testing for pathway analysis improves comparability of different microarray data sets.</dc:title>

    <dc:creator>Theodora Manoli</dc:creator>
    <dc:creator>Norbert Gretz</dc:creator>
    <dc:creator>Hermann-Josef Gröne</dc:creator>
    <dc:creator>Marc Kenzelmann</dc:creator>
    <dc:creator>Roland Eils</dc:creator>
    <dc:creator>Benedikt Brors</dc:creator>
    <dc:source>Bioinformatics (7 August 2006)</dc:source>
    <dc:date>2006-08-22T14:19:27-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Bioinformatics</prism:publicationName>
    <prism:issn>1460-2059</prism:issn>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/2140896">
    <title>Module-based outcome prediction using breast cancer compendia.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/2140896</link>
    <description>&lt;i&gt;PLoS ONE, Vol. 2, No. 10. (2007)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND: The availability of large collections of microarray datasets (compendia), or knowledge about grouping of genes into pathways (gene sets), is typically not exploited when training predictors of disease outcome. These can be useful since a compendium increases the number of samples, while gene sets reduce the size of the feature space. This should be favorable from a machine learning perspective and result in more robust predictors. METHODOLOGY: We extracted modules of regulated genes from gene sets, and compendia. Through supervised analysis, we constructed predictors which employ modules predictive of breast cancer outcome. To validate these predictors we applied them to independent data, from the same institution (intra-dataset), and other institutions (inter-dataset). CONCLUSIONS: We show that modules derived from single breast cancer datasets achieve better performance on the validation data compared to gene-based predictors. We also show that there is a trend in compendium specificity and predictive performance: modules derived from a single breast cancer dataset, and a breast cancer specific compendium perform better compared to those derived from a human cancer compendium. Additionally, the module-based predictor provides a much richer insight into the underlying biology. Frequently selected gene sets are associated with processes such as cell cycle, E2F regulation, DNA damage response, proteasome and glycolysis. We analyzed two modules related to cell cycle, and the OCT1 transcription factor, respectively. On an individual basis, these modules provide a significant separation in survival subgroups on the training and independent validation data.</description>
    <dc:title>Module-based outcome prediction using breast cancer compendia.</dc:title>

    <dc:creator>MH van Vliet</dc:creator>
    <dc:creator>CN Klijn</dc:creator>
    <dc:creator>LF Wessels</dc:creator>
    <dc:creator>MJ Reinders</dc:creator>
    <dc:identifier>doi:10.1371/journal.pone.0001047</dc:identifier>
    <dc:source>PLoS ONE, Vol. 2, No. 10. (2007)</dc:source>
    <dc:date>2007-12-18T13:02:16-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:publicationName>PLoS ONE</prism:publicationName>
    <prism:issn>1932-6203</prism:issn>
    <prism:volume>2</prism:volume>
    <prism:number>10</prism:number>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/1324276">
    <title>GOSim - An R-package for computation of information theoretic GO similarities between terms and gene products</title>
    <link>http://www.citeulike.org/user/macavity1g/article/1324276</link>
    <description>&lt;i&gt;BMC Bioinformatics, Vol. 8 (22 May 2007), 166.&lt;/i&gt;</description>
    <dc:title>GOSim - An R-package for computation of information theoretic GO similarities between terms and gene products</dc:title>

    <dc:creator>Holger Froehlich</dc:creator>
    <dc:creator>Nora Speer</dc:creator>
    <dc:creator>Annemarie Poustka</dc:creator>
    <dc:creator>Tim Beissbarth</dc:creator>
    <dc:identifier>doi:10.1186/1471-2105-8-166</dc:identifier>
    <dc:source>BMC Bioinformatics, Vol. 8 (22 May 2007), 166.</dc:source>
    <dc:date>2007-05-24T04:38:16-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:publicationName>BMC Bioinformatics</prism:publicationName>
    <prism:issn>1471-2105</prism:issn>
    <prism:volume>8</prism:volume>
    <prism:startingPage>166</prism:startingPage>
    <prism:category>go</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/835519">
    <title>Coexpression analysis of human genes across many microarray data sets.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/835519</link>
    <description>&lt;i&gt;Genome Res, Vol. 14, No. 6. (June 2004), pp. 1085-1094.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We present a large-scale analysis of mRNA coexpression based on 60 large human data sets containing a total of 3924 microarrays. We sought pairs of genes that were reliably coexpressed (based on the correlation of their expression profiles) in multiple data sets, establishing a high-confidence network of 8805 genes connected by 220,649 &#34;coexpression links&#34; that are observed in at least three data sets. Confirmed positive correlations between genes were much more common than confirmed negative correlations. We show that confirmation of coexpression in multiple data sets is correlated with functional relatedness, and show how cluster analysis of the network can reveal functionally coherent groups of genes. Our findings demonstrate how the large body of accumulated microarray data can be exploited to increase the reliability of inferences about gene function.</description>
    <dc:title>Coexpression analysis of human genes across many microarray data sets.</dc:title>

    <dc:creator>HK Lee</dc:creator>
    <dc:creator>AK Hsu</dc:creator>
    <dc:creator>J Sajdak</dc:creator>
    <dc:creator>J Qin</dc:creator>
    <dc:creator>P Pavlidis</dc:creator>
    <dc:identifier>doi:10.1101/gr.1910904</dc:identifier>
    <dc:source>Genome Res, Vol. 14, No. 6. (June 2004), pp. 1085-1094.</dc:source>
    <dc:date>2006-09-08T15:43:38-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:publicationName>Genome Res</prism:publicationName>
    <prism:issn>1088-9051</prism:issn>
    <prism:volume>14</prism:volume>
    <prism:number>6</prism:number>
    <prism:startingPage>1085</prism:startingPage>
    <prism:endingPage>1094</prism:endingPage>
    <prism:category>go</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/1238">
    <title>An information-theoretic definition of similarity</title>
    <link>http://www.citeulike.org/user/macavity1g/article/1238</link>
    <description>&lt;i&gt;(1998), pp. 296-304.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Similarity is an important and widely used concept. Previous definitions of similarity are tied to a particular application or a form of knowledge representation. We present an informationtheoretic definition of similarity that is applicable as long as there is a probabilistic model. We demonstrate how our definition can be used to measure the similarity in a number of different domains. 1 Introduction Similarity is a fundamental and widely used concept. Many similarity measures have been...</description>
    <dc:title>An information-theoretic definition of similarity</dc:title>

    <dc:creator>Dekang Lin</dc:creator>
    <dc:source>(1998), pp. 296-304.</dc:source>
    <dc:date>2004-12-01T09:41:43-00:00</dc:date>
    <prism:publicationYear>1998</prism:publicationYear>
    <prism:startingPage>296</prism:startingPage>
    <prism:endingPage>304</prism:endingPage>
    <prism:publisher>Morgan Kaufmann, San Francisco, CA</prism:publisher>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/1122908">
    <title>Semantic Similarity Based on Corpus Statistics and Lexical Taxonomy</title>
    <link>http://www.citeulike.org/user/macavity1g/article/1122908</link>
    <description>&lt;i&gt;&lt;/i&gt;</description>
    <dc:title>Semantic Similarity Based on Corpus Statistics and Lexical Taxonomy</dc:title>

    <dc:creator>Jay Jiang</dc:creator>
    <dc:creator>David Conrath</dc:creator>
    <dc:date>2007-02-26T13:33:28-00:00</dc:date>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/1268851">
    <title>Correlation between gene expression and GO semantic similarity.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/1268851</link>
    <description>&lt;i&gt;IEEE/ACM Trans Comput Biol Bioinform, Vol. 2, No. 4. (c 2005), pp. 330-338.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;This research analyzes some aspects of the relationship between gene expression, gene function, and gene annotation. Many recent studies are implicitly based on the assumption that gene products that are biologically and functionally related would maintain this similarity both in their expression profiles as well as in their Gene Ontology (GO) annotation. We analyze how accurate this assumption proves to be using real publicly available data. We also aim to validate a measure of semantic similarity for GO annotation. We use the Pearson correlation coefficient and its absolute value as a measure of similarity between expression profiles of gene products. We explore a number of semantic similarity measures (Resnik, Jiang, and Lin) and compute the similarity between gene products annotated using the GO. Finally, we compute correlation coefficients to compare gene expression similarity against GO semantic similarity. Our results suggest that the Resnik similarity measure outperforms the others and seems better suited for use in Gene Ontology. We also deduce that there seems to be correlation between semantic similarity in the GO annotation and gene expression for the three GO ontologies. We show that this correlation is negligible up to a certain semantic similarity value; then, for higher similarity values, the relationship trend becomes almost linear. These results can be used to augment the knowledge provided by clustering algorithms and in the development of bioinformatic tools for finding and characterizing gene products.</description>
    <dc:title>Correlation between gene expression and GO semantic similarity.</dc:title>

    <dc:creator>JL Sevilla</dc:creator>
    <dc:creator>V Segura</dc:creator>
    <dc:creator>A Podhorski</dc:creator>
    <dc:creator>E Guruceaga</dc:creator>
    <dc:creator>JM Mato</dc:creator>
    <dc:creator>LA Martínez-Cruz</dc:creator>
    <dc:creator>FJ Corrales</dc:creator>
    <dc:creator>A Rubio</dc:creator>
    <dc:identifier>doi:10.1109/TCBB.2005.50</dc:identifier>
    <dc:source>IEEE/ACM Trans Comput Biol Bioinform, Vol. 2, No. 4. (c 2005), pp. 330-338.</dc:source>
    <dc:date>2007-04-30T18:15:25-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>IEEE/ACM Trans Comput Biol Bioinform</prism:publicationName>
    <prism:issn>1545-5963</prism:issn>
    <prism:volume>2</prism:volume>
    <prism:number>4</prism:number>
    <prism:startingPage>330</prism:startingPage>
    <prism:endingPage>338</prism:endingPage>
    <prism:category>go</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/697707">
    <title>A new measure for functional similarity of gene products based on Gene Ontology</title>
    <link>http://www.citeulike.org/user/macavity1g/article/697707</link>
    <description>&lt;i&gt;BMC Bioinformatics, Vol. 7 (15 June 2006), 302.&lt;/i&gt;</description>
    <dc:title>A new measure for functional similarity of gene products based on Gene Ontology</dc:title>

    <dc:creator>Andreas Schlicker</dc:creator>
    <dc:creator>Francisco Domingues</dc:creator>
    <dc:creator>Jorg Rahnenfuhrer</dc:creator>
    <dc:creator>Thomas Lengauer</dc:creator>
    <dc:identifier>doi:10.1186/1471-2105-7-302</dc:identifier>
    <dc:source>BMC Bioinformatics, Vol. 7 (15 June 2006), 302.</dc:source>
    <dc:date>2006-06-16T01:26:59-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>BMC Bioinformatics</prism:publicationName>
    <prism:issn>1471-2105</prism:issn>
    <prism:volume>7</prism:volume>
    <prism:startingPage>302</prism:startingPage>
    <prism:category>go</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/349668">
    <title>Ontological analysis of gene expression data: current tools, limitations, and open problems.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/349668</link>
    <description>&lt;i&gt;Bioinformatics, Vol. 21, No. 18. (15 September 2005), pp. 3587-3595.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Independent of the platform and the analysis methods used, the result of a microarray experiment is, in most cases, a list of differentially expressed genes. An automatic ontological analysis approach has been recently proposed to help with the biological interpretation of such results. Currently, this approach is the de facto standard for the secondary analysis of high throughput experiments and a large number of tools have been developed for this purpose. We present a detailed comparison of 14 such tools using the following criteria: scope of the analysis, visualization capabilities, statistical model(s) used, correction for multiple comparisons, reference microarrays available, installation issues and sources of annotation data. This detailed analysis of the capabilities of these tools will help researchers choose the most appropriate tool for a given type of analysis. More importantly, in spite of the fact that this type of analysis has been generally adopted, this approach has several important intrinsic drawbacks. These drawbacks are associated with all tools discussed and represent conceptual limitations of the current state-of-the-art in ontological analysis. We propose these as challenges for the next generation of secondary data analysis tools.</description>
    <dc:title>Ontological analysis of gene expression data: current tools, limitations, and open problems.</dc:title>

    <dc:creator>P Khatri</dc:creator>
    <dc:creator>S Drăghici</dc:creator>
    <dc:identifier>doi:10.1093/bioinformatics/bti565</dc:identifier>
    <dc:source>Bioinformatics, Vol. 21, No. 18. (15 September 2005), pp. 3587-3595.</dc:source>
    <dc:date>2005-10-13T02:53:06-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Bioinformatics</prism:publicationName>
    <prism:issn>1367-4803</prism:issn>
    <prism:volume>21</prism:volume>
    <prism:number>18</prism:number>
    <prism:startingPage>3587</prism:startingPage>
    <prism:endingPage>3595</prism:endingPage>
    <prism:category>go</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/63158">
    <title>GO::TermFinder-open source software for accessing Gene Ontology information and finding significantly enriched Gene Ontology terms associated with a list of genes</title>
    <link>http://www.citeulike.org/user/macavity1g/article/63158</link>
    <description>&lt;i&gt;Bioinformatics, Vol. 20, No. 18., 3710.&lt;/i&gt;</description>
    <dc:title>GO::TermFinder-open source software for accessing Gene Ontology information and finding significantly enriched Gene Ontology terms associated with a list of genes</dc:title>

    <dc:creator>Elizabeth Boyle</dc:creator>
    <dc:creator>Shuai Weng</dc:creator>
    <dc:creator>Jeremy Gollub</dc:creator>
    <dc:creator>Heng Jin</dc:creator>
    <dc:creator>David Botstein</dc:creator>
    <dc:creator>Michael Cherry</dc:creator>
    <dc:creator>Gavin Sherlock</dc:creator>
    <dc:identifier>doi:10.1093/bioinformatics/bth456</dc:identifier>
    <dc:source>Bioinformatics, Vol. 20, No. 18., 3710.</dc:source>
    <dc:date>2004-12-28T18:22:25-00:00</dc:date>
    <prism:publicationName>Bioinformatics</prism:publicationName>
    <prism:issn>1367-4803</prism:issn>
    <prism:volume>20</prism:volume>
    <prism:number>18</prism:number>
    <prism:startingPage>3710</prism:startingPage>
    <prism:publisher>Oxford University Press</prism:publisher>
    <prism:category>go</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/1068457">
    <title>Using GOstats to test gene lists for GO term association</title>
    <link>http://www.citeulike.org/user/macavity1g/article/1068457</link>
    <description>&lt;i&gt;Bioinformatics, Vol. 23, No. 2. (15 January 2007), pp. 257-258.&lt;/i&gt;</description>
    <dc:title>Using GOstats to test gene lists for GO term association</dc:title>

    <dc:creator>Falcon</dc:creator>
    <dc:creator></dc:creator>
    <dc:creator>Gentleman</dc:creator>
    <dc:creator></dc:creator>
    <dc:identifier>doi:10.1093/bioinformatics/btl567</dc:identifier>
    <dc:source>Bioinformatics, Vol. 23, No. 2. (15 January 2007), pp. 257-258.</dc:source>
    <dc:date>2007-01-26T03:04:21-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:publicationName>Bioinformatics</prism:publicationName>
    <prism:issn>1367-4803</prism:issn>
    <prism:volume>23</prism:volume>
    <prism:number>2</prism:number>
    <prism:startingPage>257</prism:startingPage>
    <prism:endingPage>258</prism:endingPage>
    <prism:publisher>Oxford University Press</prism:publisher>
    <prism:category>go</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/1038497">
    <title>GO PaD: the Gene Ontology Partition Database.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/1038497</link>
    <description>&lt;i&gt;Nucleic Acids Res, Vol. 35, No. Database issue. (January 2007)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Gene Ontology (GO) has been widely used to infer functional significance associated with sets of genes in order to automate discoveries within large-scale genetic studies. A level in GO's direct acyclic graph structure is often assumed to be indicative of its terms' specificities, although other work has suggested this assumption does not hold. Unfortunately, quantitative analysis of biological functions based on nodes at the same level (as is common in gene enrichment analysis tools) can lead to incorrect conclusions as well as missed discoveries due to inefficient use of available information. This paper addresses these using an informational theoretic approach encoded in the GO Partition Database that guarantees to maximize information for gene enrichment analysis. The GO Partition Database was designed to feature ontology partitions with GO terms of similar specificity. The GO partitions comprise varying numbers of nodes and present relevant information theoretic statistics, so researchers can choose to analyze datasets at arbitrary levels of specificity. The GO Partition Database, featuring GO partition sets for functional analysis of genes from human and 10 other commonly studied organisms with a total of 131,972 genes, is available on the internet at: bcl.med.harvard.edu/proj/gopart. The site also includes an online tutorial.</description>
    <dc:title>GO PaD: the Gene Ontology Partition Database.</dc:title>

    <dc:creator>G Alterovitz</dc:creator>
    <dc:creator>M Xiang</dc:creator>
    <dc:creator>M Mohan</dc:creator>
    <dc:creator>MF Ramoni</dc:creator>
    <dc:source>Nucleic Acids Res, Vol. 35, No. Database issue. (January 2007)</dc:source>
    <dc:date>2007-01-12T17:18:10-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:publicationName>Nucleic Acids Res</prism:publicationName>
    <prism:issn>1362-4962</prism:issn>
    <prism:volume>35</prism:volume>
    <prism:number>Database issue</prism:number>
    <prism:category>go</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/1164885">
    <title>A robust hybrid between genetic algorithm and support vector machine for extracting an optimal feature gene subset.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/1164885</link>
    <description>&lt;i&gt;Genomics, Vol. 85, No. 1. (January 2005), pp. 16-23.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Development of a robust and efficient approach for extracting useful information from microarray data continues to be a significant and challenging task. Microarray data are characterized by a high dimension, high signal-to-noise ratio, and high correlations between genes, but with a relatively small sample size. Current methods for dimensional reduction can further be improved for the scenario of the presence of a single (or a few) high influential gene(s) in which its effect in the feature subset would prohibit inclusion of other important genes. We have formalized a robust gene selection approach based on a hybrid between genetic algorithm and support vector machine. The major goal of this hybridization was to exploit fully their respective merits (e.g., robustness to the size of solution space and capability of handling a very large dimension of feature genes) for identification of key feature genes (or molecular signatures) for a complex biological phenotype. We have applied the approach to the microarray data of diffuse large B cell lymphoma to demonstrate its behaviors and properties for mining the high-dimension data of genome-wide gene expression profiles. The resulting classifier(s) (the optimal gene subset(s)) has achieved the highest accuracy (99%) for prediction of independent microarray samples in comparisons with marginal filters and a hybrid between genetic algorithm and K nearest neighbors.</description>
    <dc:title>A robust hybrid between genetic algorithm and support vector machine for extracting an optimal feature gene subset.</dc:title>

    <dc:creator>L Li</dc:creator>
    <dc:creator>W Jiang</dc:creator>
    <dc:creator>X Li</dc:creator>
    <dc:creator>KL Moser</dc:creator>
    <dc:creator>Z Guo</dc:creator>
    <dc:creator>L Du</dc:creator>
    <dc:creator>Q Wang</dc:creator>
    <dc:creator>EJ Topol</dc:creator>
    <dc:creator>Q Wang</dc:creator>
    <dc:creator>S Rao</dc:creator>
    <dc:identifier>doi:10.1016/j.ygeno.2004.09.007</dc:identifier>
    <dc:source>Genomics, Vol. 85, No. 1. (January 2005), pp. 16-23.</dc:source>
    <dc:date>2007-03-14T22:08:27-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Genomics</prism:publicationName>
    <prism:issn>0888-7543</prism:issn>
    <prism:volume>85</prism:volume>
    <prism:number>1</prism:number>
    <prism:startingPage>16</prism:startingPage>
    <prism:endingPage>23</prism:endingPage>
    <prism:category>geneticalgorithm</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/1164880">
    <title>Finding the Optimal Gene Order in Displaying Microarray Data</title>
    <link>http://www.citeulike.org/user/macavity1g/article/1164880</link>
    <description>&lt;i&gt;&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;The rapid advances of genome-scale sequencing have brought out the necessity of developing new data processing techniques for enormous genomic data. Microarrays, for example, can generate such a large number of gene expression data that we usually analyze them with some clustering algorithms. However, the clustering algorithms have been ine ective for visualization in that they are not concerned about the order of genes in each cluster. In this paper, a hybrid genetic algorithm for...</description>
    <dc:title>Finding the Optimal Gene Order in Displaying Microarray Data</dc:title>

    <dc:creator>Seung Lee</dc:creator>
    <dc:creator>Yong Kim</dc:creator>
    <dc:creator>Byung Moon</dc:creator>
    <dc:date>2007-03-14T22:01:28-00:00</dc:date>
    <prism:category>geneticalgorithm</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/1105945">
    <title>A parallel genetic algorithm for single class pattern classification and its application for gene expression profiling in Streptomyces coelicolor.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/1105945</link>
    <description>&lt;i&gt;BMC Genomics, Vol. 8 (13 February 2007), 49.&lt;/i&gt;</description>
    <dc:title>A parallel genetic algorithm for single class pattern classification and its application for gene expression profiling in Streptomyces coelicolor.</dc:title>

    <dc:creator>Cuong To</dc:creator>
    <dc:creator>Jiri Vohradsky</dc:creator>
    <dc:identifier>doi:10.1186/1471-2164-8-49</dc:identifier>
    <dc:source>BMC Genomics, Vol. 8 (13 February 2007), 49.</dc:source>
    <dc:date>2007-02-13T21:30:34-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:publicationName>BMC Genomics</prism:publicationName>
    <prism:issn>1471-2164</prism:issn>
    <prism:volume>8</prism:volume>
    <prism:startingPage>49</prism:startingPage>
    <prism:category>geneticalgorithm</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/695901">
    <title>Towards precise classification of cancers based on robust gene functional expression profiles</title>
    <link>http://www.citeulike.org/user/macavity1g/article/695901</link>
    <description>&lt;i&gt;BMC Bioinformatics, Vol. 6, No. 1. (2005)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND:Development of robust and efficient methods for analyzing and interpreting high dimension gene expression profiles continues to be a focus in computational biology. The accumulated experiment evidence supports the assumption that genes express and perform their functions in modular fashions in cells. Therefore, there is an open space for development of the timely and relevant computational algorithms that use robust functional expression profiles towards precise classification of complex human diseases at the modular level.RESULTS:Inspired by the insight that genes act as a module to carry out a highly integrated cellular function, we thus define a low dimension functional expression profile for data reduction. After annotating each individual gene to functional categories defined in a proper gene function classification system such as Gene Ontology applied in this study, we identify those functional categories enriched with differentially expressed genes. For each functional category or functional module, we compute a summary measure (s) for the raw expression values of the annotated genes to capture the overall activity level of the module. In this way, we can treat the gene expressions within a functional module as an integrative data point to replace the multiple values of individual genes. We compare the classification performance of decision trees based on functional expression profiles with the conventional gene expression profiles using four publicly available datasets, which indicates that precise classification of tumour types and improved interpretation can be achieved with the reduced functional expression profiles.CONCLUSION:This modular approach is demonstrated to be a powerful alternative approach to analyzing high dimension microarray data and is robust to high measurement noise and intrinsic biological variance inherent in microarray data. Furthermore, efficient integration with current biological knowledge has facilitated the interpretation of the underlying molecular mechanisms for complex human diseases at the modular level.</description>
    <dc:title>Towards precise classification of cancers based on robust gene functional expression profiles</dc:title>

    <dc:creator>Zheng Guo</dc:creator>
    <dc:creator>Tianwen Zhang</dc:creator>
    <dc:creator>Xia Li</dc:creator>
    <dc:creator>Qi Wang</dc:creator>
    <dc:creator>Jianzhen Xu</dc:creator>
    <dc:creator>Hui Yu</dc:creator>
    <dc:creator>Jing Zhu</dc:creator>
    <dc:creator>Haiyun Wang</dc:creator>
    <dc:creator>Chenguang Wang</dc:creator>
    <dc:creator>Eric Topol</dc:creator>
    <dc:creator>Qing Wang</dc:creator>
    <dc:creator>Shaoqi Rao</dc:creator>
    <dc:identifier>doi:10.1186/1471-2105-6-58</dc:identifier>
    <dc:source>BMC Bioinformatics, Vol. 6, No. 1. (2005)</dc:source>
    <dc:date>2006-06-14T14:11:32-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>BMC Bioinformatics</prism:publicationName>
    <prism:volume>6</prism:volume>
    <prism:number>1</prism:number>
    <prism:category>go</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/973077">
    <title>Using the principle of entropy maximization to infer genetic interaction networks from gene expression patterns.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/973077</link>
    <description>&lt;i&gt;Proc Natl Acad Sci U S A (30 November 2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We describe a method based on the principle of entropy maximization to identify the gene interaction network with the highest probability of giving rise to experimentally observed transcript profiles. In its simplest form, the method yields the pairwise gene interaction network, but it can also be extended to deduce higher-order interactions. Analysis of microarray data from genes in Saccharomyces cerevisiae chemostat cultures exhibiting energy metabolic oscillations identifies a gene interaction network that reflects the intracellular communication pathways that adjust cellular metabolic activity and cell division to the limiting nutrient conditions that trigger metabolic oscillations. The success of the present approach in extracting meaningful genetic connections suggests that the maximum entropy principle is a useful concept for understanding living systems, as it is for other complex, nonequilibrium systems.</description>
    <dc:title>Using the principle of entropy maximization to infer genetic interaction networks from gene expression patterns.</dc:title>

    <dc:creator>Timothy R Lezon</dc:creator>
    <dc:creator>Jayanth R Banavar</dc:creator>
    <dc:creator>Marek Cieplak</dc:creator>
    <dc:creator>Amos Maritan</dc:creator>
    <dc:creator>Nina V Fedoroff</dc:creator>
    <dc:identifier>doi:10.1073/pnas.0609152103</dc:identifier>
    <dc:source>Proc Natl Acad Sci U S A (30 November 2006)</dc:source>
    <dc:date>2006-12-04T13:28:19-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Proc Natl Acad Sci U S A</prism:publicationName>
    <prism:issn>0027-8424</prism:issn>
    <prism:category>entropy</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/927557">
    <title>Inference of disease-related molecular logic from systems-based microarray analysis.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/927557</link>
    <description>&lt;i&gt;PLoS Comput Biol, Vol. 2, No. 6. (16 June 2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Computational analysis of gene expression data from microarrays has been useful for medical diagnosis and prognosis. The ability to analyze such data at the level of biological modules, rather than individual genes, has been recognized as important for improving our understanding of disease-related pathways. It has proved difficult, however, to infer pathways from microarray data by deriving modules of multiple synergistically interrelated genes, rather than individual genes. Here we propose a systems-based approach called Entropy Minimization and Boolean Parsimony (EMBP) that identifies, directly from gene expression data, modules of genes that are jointly associated with disease. Furthermore, the technique provides insight into the underlying biomolecular logic by inferring a logic function connecting the joint expression levels in a gene module with the outcome of disease. Coupled with biological knowledge, this information can be useful for identifying disease-related pathways, suggesting potential therapeutic approaches for interfering with the functions of such pathways. We present an example providing such gene modules associated with prostate cancer from publicly available gene expression data, and we successfully validate the results on additional independently derived data. Our results indicate a link between prostate cancer and cellular damage from oxidative stress combined with inhibition of apoptotic mechanisms normally triggered by such damage.</description>
    <dc:title>Inference of disease-related molecular logic from systems-based microarray analysis.</dc:title>

    <dc:creator>V Varadan</dc:creator>
    <dc:creator>D Anastassiou</dc:creator>
    <dc:identifier>doi:10.1371/journal.pcbi.0020068</dc:identifier>
    <dc:source>PLoS Comput Biol, Vol. 2, No. 6. (16 June 2006)</dc:source>
    <dc:date>2006-11-03T16:26:12-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>PLoS Comput Biol</prism:publicationName>
    <prism:issn>1553-7358</prism:issn>
    <prism:volume>2</prism:volume>
    <prism:number>6</prism:number>
    <prism:category>entropy</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/530843">
    <title>An entropy-based gene selection method for cancer classification using microarray data.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/530843</link>
    <description>&lt;i&gt;BMC Bioinformatics, Vol. 6, No. 1. (2005)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND: Accurate diagnosis of cancer subtypes remains a challenging problem. Building classifiers based on gene expression data is a promising approach; yet the selection of non-redundant but relevant genes is difficult. The selected gene set should be small enough to allow diagnosis even in regular clinical laboratories and ideally identify genes involved in cancer-specific regulatory pathways. Here an entropy-based method is proposed that selects genes related to the different cancer classes while at the same time reducing the redundancy among the genes. RESULTS: The present study identifies a subset of features by maximizing the relevance and minimizing the redundancy of the selected genes. A merit called normalized mutual information is employed to measure the relevance and the redundancy of the genes. In order to find a more representative subset of features, an iterative procedure is adopted that incorporates an initial clustering followed by data partitioning and the application of the algorithm to each of the partitions. A leave-one-out approach then selects the most commonly selected genes across all the different runs and the gene selection algorithm is applied again to pare down the list of selected genes until a minimal subset is obtained that gives a satisfactory accuracy of classification. The algorithm was applied to three different data sets and the results obtained were compared to work done by others using the same data sets. CONCLUSION: This study presents an entropy-based iterative algorithm for selecting genes from microarray data that are able to classify various cancer sub-types with high accuracy. In addition, the feature set obtained is very compact, that is, the redundancy between genes is reduced to a large extent. This implies that classifiers can be built with a smaller subset of genes.</description>
    <dc:title>An entropy-based gene selection method for cancer classification using microarray data.</dc:title>

    <dc:creator>X Liu</dc:creator>
    <dc:creator>A Krishnan</dc:creator>
    <dc:creator>A Mondry</dc:creator>
    <dc:identifier>doi:10.1186/1471-2105-6-76</dc:identifier>
    <dc:source>BMC Bioinformatics, Vol. 6, No. 1. (2005)</dc:source>
    <dc:date>2006-03-04T12:00:25-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>BMC Bioinformatics</prism:publicationName>
    <prism:issn>1471-2105</prism:issn>
    <prism:volume>6</prism:volume>
    <prism:number>1</prism:number>
    <prism:category>entropy</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/63193">
    <title>The `subsequent artificial neural network' (SANN) approach might bring more classificatory power to ANN-based DNA microarray analyses</title>
    <link>http://www.citeulike.org/user/macavity1g/article/63193</link>
    <description>&lt;i&gt;Bioinformatics, Vol. 20, No. 18., 3544.&lt;/i&gt;</description>
    <dc:title>The `subsequent artificial neural network' (SANN) approach might bring more classificatory power to ANN-based DNA microarray analyses</dc:title>

    <dc:creator>Roland Linder</dc:creator>
    <dc:creator>Dawn Dew</dc:creator>
    <dc:creator>Holger Sudhoff</dc:creator>
    <dc:creator>Dirk Theegarten</dc:creator>
    <dc:creator>Klaus Remberger</dc:creator>
    <dc:creator>Siegfried Poppl</dc:creator>
    <dc:creator>Mathias Wagner</dc:creator>
    <dc:identifier>doi:10.1093/bioinformatics/bth441</dc:identifier>
    <dc:source>Bioinformatics, Vol. 20, No. 18., 3544.</dc:source>
    <dc:date>2004-12-28T18:22:26-00:00</dc:date>
    <prism:publicationName>Bioinformatics</prism:publicationName>
    <prism:issn>1367-4803</prism:issn>
    <prism:volume>20</prism:volume>
    <prism:number>18</prism:number>
    <prism:startingPage>3544</prism:startingPage>
    <prism:publisher>Oxford University Press</prism:publisher>
    <prism:category>microarray</prism:category>
    <prism:category>neuralnetwork</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/118774">
    <title>Neural network analysis of lymphoma microarray data: prognosis and diagnosis near-perfect.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/118774</link>
    <description>&lt;i&gt;BMC Bioinformatics, Vol. 4, No. 1. (10 April 2003)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND: Microarray chips are being rapidly deployed as a major tool in genomic research. To date most of the analysis of the enormous amount of information provided on these chips has relied on clustering techniques and other standard statistical procedures. These methods, particularly with regard to cancer patient prognosis, have generally been inadequate in providing the reduced gene subsets required for perfect classification. RESULTS: Networks trained on microarray data from DLBCL lymphoma patients have, for the first time, been able to predict the long-term survival of individual patients with 100% accuracy. Other networks were able to distinguish DLBCL lymphoma donors from other donors, including donors with other lymphomas, with 99% accuracy. Differentiating the trained network can narrow the gene profile to less than three dozen genes for each classification. CONCLUSIONS: Here we show that artificial neural networks are a superior tool for digesting microarray data both with regard to making distinctions based on the data and with regard to providing very specific reference as to which genes were most important in making the correct distinction in each case.</description>
    <dc:title>Neural network analysis of lymphoma microarray data: prognosis and diagnosis near-perfect.</dc:title>

    <dc:creator>MC O'Neill</dc:creator>
    <dc:creator>L Song</dc:creator>
    <dc:source>BMC Bioinformatics, Vol. 4, No. 1. (10 April 2003)</dc:source>
    <dc:date>2005-03-09T21:18:33-00:00</dc:date>
    <prism:publicationYear>2003</prism:publicationYear>
    <prism:publicationName>BMC Bioinformatics</prism:publicationName>
    <prism:issn>1471-2105</prism:issn>
    <prism:volume>4</prism:volume>
    <prism:number>1</prism:number>
    <prism:category>microarray</prism:category>
    <prism:category>neuralnetwork</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/1031417">
    <title>Molecular classification of human cancers using a 92-gene real-time quantitative polymerase chain reaction assay.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/1031417</link>
    <description>&lt;i&gt;Arch Pathol Lab Med, Vol. 130, No. 4. (April 2006), pp. 465-473.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;CONTEXT: Correct diagnosis of the tissue origin of a metastatic cancer is the first step in disease management, but it is frequently difficult using standard pathologic methods. Microarray-based gene expression profiling has shown great promise as a new tool to address this challenge. OBJECTIVE: Adoption of microarray technologies in the clinic remains limited. We aimed to bridge this technological gap by developing a real-time quantitative polymerase chain reaction (RT-PCR) assay. DESIGN: We constructed a microarray database of 466 frozen and 112 formalin-fixed, paraffin-embedded (FFPE) samples of both primary and metastatic tumors, measuring expression of 22,000 genes. From the microarray database, we used a genetic algorithm to search for gene combinations optimal for multitumor classification. A 92-gene RT-PCR assay was then designed and used to generate a database for 481 frozen and 119 FFPE tumor samples. RESULTS: The microarray-based K-nearest neighbor classifier demonstrated 84% accuracy in classifying 39 tumor types via cross-validation and 82% accuracy in predicting 112 independent FFPE samples. We successfully translated the microarray database to the RT-PCR platform, which allowed an overall success rate of 87% in classifying 32 different tumor classes in the validation set of 119 FFPE tumor samples. CONCLUSIONS: The RT-PCR-based expression assay involving 92 genes represents a powerful tool for accurately and objectively identifying the site of origin for metastatic tumors, especially in the cases of cancer of unknown primary. The assay uses RT-PCR and routine FFPE samples, making it suitable for rapid clinical adoption.</description>
    <dc:title>Molecular classification of human cancers using a 92-gene real-time quantitative polymerase chain reaction assay.</dc:title>

    <dc:creator>XJ Ma</dc:creator>
    <dc:creator>R Patel</dc:creator>
    <dc:creator>X Wang</dc:creator>
    <dc:creator>R Salunga</dc:creator>
    <dc:creator>J Murage</dc:creator>
    <dc:creator>R Desai</dc:creator>
    <dc:creator>JT Tuggle</dc:creator>
    <dc:creator>W Wang</dc:creator>
    <dc:creator>S Chu</dc:creator>
    <dc:creator>K Stecker</dc:creator>
    <dc:creator>R Raja</dc:creator>
    <dc:creator>H Robin</dc:creator>
    <dc:creator>M Moore</dc:creator>
    <dc:creator>D Baunoch</dc:creator>
    <dc:creator>D Sgroi</dc:creator>
    <dc:creator>M Erlander</dc:creator>
    <dc:source>Arch Pathol Lab Med, Vol. 130, No. 4. (April 2006), pp. 465-473.</dc:source>
    <dc:date>2007-01-09T11:53:16-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Arch Pathol Lab Med</prism:publicationName>
    <prism:issn>1543-2165</prism:issn>
    <prism:volume>130</prism:volume>
    <prism:number>4</prism:number>
    <prism:startingPage>465</prism:startingPage>
    <prism:endingPage>473</prism:endingPage>
    <prism:category>geneticalgorithm</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/597632">
    <title>A systems approach to clinical oncology: Focus on breast cancer</title>
    <link>http://www.citeulike.org/user/macavity1g/article/597632</link>
    <description>&lt;i&gt;Proteome Science, Vol. 4, No. 1. (04 April 2006), 5.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;ABSTRACT: During the past decade, genomic microarrays have been applied with some success to the molecular profiling of breast tumours, which has resulted in a much more detailed classification scheme as well as in the identification of potential gene signature sets. These gene sets have been applied to both the prognosis and prediction of outcome to treatment and have performed better than the current clinical criteria. One of the main limitations of microarray analysis, however, is that frozen tumour samples are required for the assay. This imposes severe limitations on access to samples and impedes large scale validation studies from being conducted. Quantitative reverse transcriptase polymerase chain reaction (qRT-PCR), on the other hand, can be used with degraded RNAs derived from formalin-fixed paraffin-embedded (FFPE) tumour samples, the most important and abundant source of clinical material available. More recently, the novel DASL (cDNA-mediated Annealing, Selection, extension and Ligation) assay has been developed as a high throughput gene expression profiling system specifically designed for use with FFPE tumour tissue samples. However, we do not believe that genomics is adequate as a sole prognostic and predictive platform in breast cancer. The key proteins driving oncogenesis, for example, can undergo post-translational modifications; moreover, if we are ever to move individualization of therapy into the practical world of blood-based assays, serum proteomics becomes critical. Proteomic platforms, including tissue micro-arrays (TMA) and protein chip arrays, in conjunction with surface-enhanced laser desorption ionization time-of-flight mass spectrometry (SELDI-TOF/MS), have been the technologies most widely applied to the characterization of tumours and serum, respectively, from breast cancer patients, with still limited but encouraging results. This review will focus on these genomic and proteomic platforms, with an emphasis placed on the utilization of FFPE tumour tissue samples and serum, as they have been applied to the study of breast cancer for the discovery of gene signatures and biomarkers for the early diagnosis, prognosis and prediction of treatment outcome. The ultimate goal is to be able to apply a systems biology approach to the information gleaned from the utilization of both of these platforms in order to select the best treatment strategy, monitor its effectiveness and make changes as rapidly as possible, where needed, to achieve the optimal therapeutic results for the patient.</description>
    <dc:title>A systems approach to clinical oncology: Focus on breast cancer</dc:title>

    <dc:creator>Mark Abramovitz</dc:creator>
    <dc:creator>Brian Leyland-Jones</dc:creator>
    <dc:identifier>doi:10.1186/1477-5956-4-5</dc:identifier>
    <dc:source>Proteome Science, Vol. 4, No. 1. (04 April 2006), 5.</dc:source>
    <dc:date>2006-04-24T11:24:15-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Proteome Science</prism:publicationName>
    <prism:issn>1477-5956</prism:issn>
    <prism:volume>4</prism:volume>
    <prism:number>1</prism:number>
    <prism:startingPage>5</prism:startingPage>
    <prism:category>breastcancer</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/994277">
    <title>Integrated breast cancer genomics.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/994277</link>
    <description>&lt;i&gt;Cancer Cell, Vol. 10, No. 6. (December 2006), pp. 453-454.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Predicting survival and therapy responses of breast cancer patients is a significant challenge. Two studies in this issue of Cancer Cell present a novel integrated analysis of genomic and transcriptomic profiles of 145 primary breast cancers and 51 established cell lines. Data from clinical tumors highlighted mechanisms of disease and facilitated identification of potential therapeutic targets and prognostic biomarkers. An extensive well-characterized cancer cell line resource opens up opportunities to explore the determinants of cellular responses to existing and emerging therapies. Taken together, these studies illustrate how integrated molecular profiling may one day significantly impact diagnosis and therapeutic choice in human breast cancer.</description>
    <dc:title>Integrated breast cancer genomics.</dc:title>

    <dc:creator>H Edgren</dc:creator>
    <dc:creator>O Kallioniemi</dc:creator>
    <dc:identifier>doi:10.1016/j.ccr.2006.11.007</dc:identifier>
    <dc:source>Cancer Cell, Vol. 10, No. 6. (December 2006), pp. 453-454.</dc:source>
    <dc:date>2006-12-14T09:51:58-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Cancer Cell</prism:publicationName>
    <prism:issn>1535-6108</prism:issn>
    <prism:volume>10</prism:volume>
    <prism:number>6</prism:number>
    <prism:startingPage>453</prism:startingPage>
    <prism:endingPage>454</prism:endingPage>
    <prism:category>breastcancer</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/1088407">
    <title>Gene expression profiling for prognosis using Cox regression.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/1088407</link>
    <description>&lt;i&gt;Stat Med, Vol. 23, No. 11. (15 June 2004), pp. 1767-1780.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Given the promise of rich biological information in microarray data we will expect an increasing demand for a robust, practical and well-tested methodology to provide patient prognosis based on gene expression data. In standard settings, with few clinical predictors, such a methodology has been provided by the Cox proportional hazard model, but no corresponding methodology is available to deal with the full set of genes in microarray data. Furthermore, we want the procedure to be able to deal with the general survival data that include censored information. Conceptually such a procedure can be constructed quite easily, but its implementation will never be straightforward due to computational problems. We have developed an approach that relies on an extension of the Cox proportional likelihood that allows random effects parameters. In this approach, we use the full set of genes in the analysis and deal with survival data in the most general way. We describe the development of the model and the steps in the implementation, including a fast computational formula based on a subsampling of the risk set and the singular value decomposition. Finally, we illustrate the methodology using a data set obtained from a cohort of breast cancer patients.</description>
    <dc:title>Gene expression profiling for prognosis using Cox regression.</dc:title>

    <dc:creator>Y Pawitan</dc:creator>
    <dc:creator>J Bjöhle</dc:creator>
    <dc:creator>S Wedren</dc:creator>
    <dc:creator>K Humphreys</dc:creator>
    <dc:creator>L Skoog</dc:creator>
    <dc:creator>F Huang</dc:creator>
    <dc:creator>L Amler</dc:creator>
    <dc:creator>P Shaw</dc:creator>
    <dc:creator>P Hall</dc:creator>
    <dc:creator>J Bergh</dc:creator>
    <dc:identifier>doi:10.1002/sim.1769</dc:identifier>
    <dc:source>Stat Med, Vol. 23, No. 11. (15 June 2004), pp. 1767-1780.</dc:source>
    <dc:date>2007-02-05T14:13:58-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:publicationName>Stat Med</prism:publicationName>
    <prism:issn>0277-6715</prism:issn>
    <prism:volume>23</prism:volume>
    <prism:number>11</prism:number>
    <prism:startingPage>1767</prism:startingPage>
    <prism:endingPage>1780</prism:endingPage>
    <prism:category>breastcancer</prism:category>
    <prism:category>cox</prism:category>
    <prism:category>microarray</prism:category>
    <prism:category>regression</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/504895">
    <title>Predicting the clinical status of human breast cancer by using gene expression profiles</title>
    <link>http://www.citeulike.org/user/macavity1g/article/504895</link>
    <description>&lt;i&gt;PNAS, Vol. 98, No. 20. (25 September 2001), pp. 11462-11467.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Prognostic and predictive factors are indispensable tools in the treatment of patients with neoplastic disease. For the most part, such factors rely on a few specific cell surface, histological, or gross pathologic features. Gene expression assays have the potential to supplement what were previously a few distinct features with many thousands of features. We have developed Bayesian regression models that provide predictive capability based on gene expression data derived from DNA microarray analysis of a series of primary breast cancer samples. These patterns have the capacity to discriminate breast tumors on the basis of estrogen receptor status and also on the categorized lymph node status. Importantly, we assess the utility and validity of such models in predicting the status of tumors in crossvalidation determinations. The practical value of such approaches relies on the ability not only to assess relative probabilities of clinical outcomes for future samples but also to provide an honest assessment of the uncertainties associated with such predictive classifications on the basis of the selection of gene subsets for each validation analysis. This latter point is of critical importance in the ability to apply these methodologies to clinical assessment of tumor phenotype.</description>
    <dc:title>Predicting the clinical status of human breast cancer by using gene expression profiles</dc:title>

    <dc:creator>Mike West</dc:creator>
    <dc:creator>Carrie Blanchette</dc:creator>
    <dc:creator>Holly Dressman</dc:creator>
    <dc:creator>Erich Huang</dc:creator>
    <dc:creator>Seiichi Ishida</dc:creator>
    <dc:creator>Rainer Spang</dc:creator>
    <dc:creator>Harry Zuzan</dc:creator>
    <dc:creator>John Olson</dc:creator>
    <dc:creator>Jeffrey Marks</dc:creator>
    <dc:creator>Joseph Nevins</dc:creator>
    <dc:identifier>doi:10.1073/pnas.201162998</dc:identifier>
    <dc:source>PNAS, Vol. 98, No. 20. (25 September 2001), pp. 11462-11467.</dc:source>
    <dc:date>2006-02-14T07:50:39-00:00</dc:date>
    <prism:publicationYear>2001</prism:publicationYear>
    <prism:publicationName>PNAS</prism:publicationName>
    <prism:volume>98</prism:volume>
    <prism:number>20</prism:number>
    <prism:startingPage>11462</prism:startingPage>
    <prism:endingPage>11467</prism:endingPage>
    <prism:category>breastcancer</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/1038480">
    <title>Integration of HapMap-based SNP pattern analysis and gene expression profiling reveals common SNP profiles for cancer therapy outcome predictor genes.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/1038480</link>
    <description>&lt;i&gt;Cell Cycle, Vol. 5, No. 22. (November 2006), pp. 2613-2625.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Recent completion of the initial phase of a haplotype map of human genome (www.hapmap.org) provides opportunity for integrative analysis on a genome-wide scale of microarray-based gene expression profiling and SNP variation patterns for discovery of cancer-causing genes and genetic markers of therapy outcome. Here we applied this approach for analysis of SNPs of cancer-associated genes, expression profiles of which predicts the likelihood of treatment failure and death after therapy in patients diagnosed with multiple types of cancer. Unexpectedly, this analysis reveals a common SNP pattern for a majority (60 of 74; 81%) of analyzed cancer treatment outcome predictor (CTOP) genes. Our analysis suggests that heritable germ-line genetic variations driven by geographically localized form of natural selection determining population differentiations may have a significant impact on cancer treatment outcome by influencing the individual's gene expression profile. We demonstrate a translational utility of this approach by building a highly informative CTOP algorithm combining prognostic power of multiple gene expression-based CTOP models derived from signatures of oncogenic pathways associated with activation of BMI1; Myc; Her2/neu; Ras; beta-catenin; Suz12; E2F; and CCND1 oncogenes. Application of a CTOP algorithm to large databases of early-stage breast and prostate tumors identifies cancer patients with 100% probability of a cure with existing cancer therapies as well as patients with nearly 100% likelihood of treatment failure, thus providing a clinically feasible framework essential for introduction of rational evidence-based individualized therapy selection and prescription protocols. Our analysis indicates that genetic determinants of human disease susceptibility and severity are encoded by population differentiation SNP variants. Evolution of these SNPs is driven by geographically-localized form of natural selection causing population differentiation. Recent analysis identifies a class of SNPs regulating gene expression in normal individuals and likely determining unique genome-wide expression profiles of each individual. We propose that critical disease-causing combinations of SNP variants arise from SNPs regulating mRNA levels and determining genome-wide haplotype patterns of individual's disease susceptibility.</description>
    <dc:title>Integration of HapMap-based SNP pattern analysis and gene expression profiling reveals common SNP profiles for cancer therapy outcome predictor genes.</dc:title>

    <dc:creator>GV Glinsky</dc:creator>
    <dc:source>Cell Cycle, Vol. 5, No. 22. (November 2006), pp. 2613-2625.</dc:source>
    <dc:date>2007-01-12T16:54:19-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Cell Cycle</prism:publicationName>
    <prism:issn>1551-4005</prism:issn>
    <prism:volume>5</prism:volume>
    <prism:number>22</prism:number>
    <prism:startingPage>2613</prism:startingPage>
    <prism:endingPage>2625</prism:endingPage>
    <prism:category>breastcancer</prism:category>
    <prism:category>microarray</prism:category>
    <prism:category>snp</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/1133608">
    <title>How to best classify breast cancer: conventional and novel classifications (review).</title>
    <link>http://www.citeulike.org/user/macavity1g/article/1133608</link>
    <description>&lt;i&gt;Int J Oncol, Vol. 27, No. 5. (November 2005), pp. 1307-1313.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Breast cancer is a complex disease and different classifications, mostly based on clinical and pathological features, have been used for guiding the management of patients. Most of them fail to reflect breast cancer heterogeneity, which could be the reason why the treatment fails in approximately 30% of cases. Emerging molecular studies based on gene expression profiling using DNA microarrays have defined new molecular subtypes of breast cancer associated with the cell-of-origin distinction. Thus, breast cancer has been divided into five subgroups with distinct biological features and clinical outcomes. We have tried here to confront the conventional existing classifications with this new molecular taxonomy. It is likely that using all types of classification together will help in the management of breast cancer.</description>
    <dc:title>How to best classify breast cancer: conventional and novel classifications (review).</dc:title>

    <dc:creator>E Charafe-Jauffret</dc:creator>
    <dc:creator>C Ginestier</dc:creator>
    <dc:creator>F Monville</dc:creator>
    <dc:creator>S Fekairi</dc:creator>
    <dc:creator>J Jacquemier</dc:creator>
    <dc:creator>D Birnbaum</dc:creator>
    <dc:creator>F Bertucci</dc:creator>
    <dc:source>Int J Oncol, Vol. 27, No. 5. (November 2005), pp. 1307-1313.</dc:source>
    <dc:date>2007-03-01T11:08:29-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Int J Oncol</prism:publicationName>
    <prism:issn>1019-6439</prism:issn>
    <prism:volume>27</prism:volume>
    <prism:number>5</prism:number>
    <prism:startingPage>1307</prism:startingPage>
    <prism:endingPage>1313</prism:endingPage>
    <prism:category>breastcancer</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/352759">
    <title>Analysis of recursive gene selection approaches from microarray data.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/352759</link>
    <description>&lt;i&gt;Bioinformatics, Vol. 21, No. 19. (1 October 2005), pp. 3741-3747.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;MOTIVATION: Finding a small subset of most predictive genes from microarray for disease prediction is a challenging problem. Support vector machines (SVMs) have been found to be successful with a recursive procedure in selecting important genes for cancer prediction. However, it is not well understood how much of the success depends on the choice of the specific classifier and how much on the recursive procedure. We answer this question by examining multiple classifers [SVM, ridge regression (RR) and Rocchio] with feature selection in recursive and non-recursive settings on three DNA microarray datasets (ALL-AML Leukemia data, Breast Cancer data and GCM data). RESULTS: We found recursive RR most effective. On the AML-ALL dataset, it achieved zero error rate on the test set using only three genes (selected from over 7000), which is more encouraging than the best published result (zero error rate using 8 genes by recursive SVM). On the Breast Cancer dataset and the two largest categories of the GCM dataset, the results achieved by recursive RR are also very encouraging. A further analysis of the experimental results shows that different classifiers penalize redundant features to different extent and this property plays an important role in the recursive feature selection process. RR classifier tends to penalize redundant features to a much larger extent than the SVM does. This may be the reason why recursive RR has a better performance in selecting genes. AVAILABILITY: The datasets are available at http://sdmc.lit.org.sg:8080/GEDatasets/Datasets.html/ CONTACT: hustlf@cs.cmu.edu.</description>
    <dc:title>Analysis of recursive gene selection approaches from microarray data.</dc:title>

    <dc:creator>F Li</dc:creator>
    <dc:creator>Y Yang</dc:creator>
    <dc:source>Bioinformatics, Vol. 21, No. 19. (1 October 2005), pp. 3741-3747.</dc:source>
    <dc:date>2005-10-17T12:37:04-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Bioinformatics</prism:publicationName>
    <prism:issn>1367-4803</prism:issn>
    <prism:volume>21</prism:volume>
    <prism:number>19</prism:number>
    <prism:startingPage>3741</prism:startingPage>
    <prism:endingPage>3747</prism:endingPage>
    <prism:category>breastcancer</prism:category>
    <prism:category>microarray</prism:category>
    <prism:category>svm</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/473090">
    <title>Are data from different gene expression microarray platforms comparable?</title>
    <link>http://www.citeulike.org/user/macavity1g/article/473090</link>
    <description>&lt;i&gt;Genomics, Vol. 83, No. 6. (June 2004), pp. 1164-1168.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Many commercial and custom-made microarray formats are routinely used for large-scale gene expression surveys. Here, we sought to determine the level of concordance between microarray platforms by analyzing breast cancer cell lines with in situ synthesized oligonucleotide arrays (Affymetrix HG-U95v2), commercial cDNA microarrays (Agilent Human 1 cDNA), and custom-made cDNA microarrays from a sequence-validated 13K cDNA library. Gene expression data from the commercial platforms showed good correlations across the experiments (r = 0.78-0.86), whereas the correlations between the custom-made and either of the two commercial platforms were lower (r = 0.62-0.76). Discrepant findings were due to clone errors on the custom-made microarrays, old annotations, or unknown causes. Even within platform, there can be several ways to analyze data that may influence the correlation between platforms. Our results indicate that combining data from different microarray platforms is not straightforward. Variability of the data represents a challenge for developing future diagnostic applications of microarrays.</description>
    <dc:title>Are data from different gene expression microarray platforms comparable?</dc:title>

    <dc:creator>AK Järvinen</dc:creator>
    <dc:creator>S Hautaniemi</dc:creator>
    <dc:creator>H Edgren</dc:creator>
    <dc:creator>P Auvinen</dc:creator>
    <dc:creator>J Saarela</dc:creator>
    <dc:creator>OP Kallioniemi</dc:creator>
    <dc:creator>O Monni</dc:creator>
    <dc:identifier>doi:10.1016/j.ygeno.2004.01.004</dc:identifier>
    <dc:source>Genomics, Vol. 83, No. 6. (June 2004), pp. 1164-1168.</dc:source>
    <dc:date>2006-01-21T05:13:28-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:publicationName>Genomics</prism:publicationName>
    <prism:issn>0888-7543</prism:issn>
    <prism:volume>83</prism:volume>
    <prism:number>6</prism:number>
    <prism:startingPage>1164</prism:startingPage>
    <prism:endingPage>1168</prism:endingPage>
    <prism:category>breastcancer</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/447448">
    <title>A gene-expression signature as a predictor of survival in breast cancer.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/447448</link>
    <description>&lt;i&gt;N Engl J Med, Vol. 347, No. 25. (19 December 2002), pp. 1999-2009.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND: A more accurate means of prognostication in breast cancer will improve the selection of patients for adjuvant systemic therapy. METHODS: Using microarray analysis to evaluate our previously established 70-gene prognosis profile, we classified a series of 295 consecutive patients with primary breast carcinomas as having a gene-expression signature associated with either a poor prognosis or a good prognosis. All patients had stage I or II breast cancer and were younger than 53 years old; 151 had lymph-node-negative disease, and 144 had lymph-node-positive disease. We evaluated the predictive power of the prognosis profile using univariable and multivariable statistical analyses. RESULTS: Among the 295 patients, 180 had a poor-prognosis signature and 115 had a good-prognosis signature, and the mean (+/-SE) overall 10-year survival rates were 54.6+/-4.4 percent and 94.5+/-2.6 percent, respectively. At 10 years, the probability of remaining free of distant metastases was 50.6+/-4.5 percent in the group with a poor-prognosis signature and 85.2+/-4.3 percent in the group with a good-prognosis signature. The estimated hazard ratio for distant metastases in the group with a poor-prognosis signature, as compared with the group with the good-prognosis signature, was 5.1 (95 percent confidence interval, 2.9 to 9.0; P&#60;0.001). This ratio remained significant when the groups were analyzed according to lymph-node status. Multivariable Cox regression analysis showed that the prognosis profile was a strong independent factor in predicting disease outcome. CONCLUSIONS: The gene-expression profile we studied is a more powerful predictor of the outcome of disease in young patients with breast cancer than standard systems based on clinical and histologic criteria.</description>
    <dc:title>A gene-expression signature as a predictor of survival in breast cancer.</dc:title>

    <dc:creator>MJ van de Vijver</dc:creator>
    <dc:creator>YD He</dc:creator>
    <dc:creator>LJ van't Veer</dc:creator>
    <dc:creator>H Dai</dc:creator>
    <dc:creator>AA Hart</dc:creator>
    <dc:creator>DW Voskuil</dc:creator>
    <dc:creator>GJ Schreiber</dc:creator>
    <dc:creator>JL Peterse</dc:creator>
    <dc:creator>C Roberts</dc:creator>
    <dc:creator>MJ Marton</dc:creator>
    <dc:creator>M Parrish</dc:creator>
    <dc:creator>D Atsma</dc:creator>
    <dc:creator>A Witteveen</dc:creator>
    <dc:creator>A Glas</dc:creator>
    <dc:creator>L Delahaye</dc:creator>
    <dc:creator>T van der Velde</dc:creator>
    <dc:creator>H Bartelink</dc:creator>
    <dc:creator>S Rodenhuis</dc:creator>
    <dc:creator>ET Rutgers</dc:creator>
    <dc:creator>SH Friend</dc:creator>
    <dc:creator>R Bernards</dc:creator>
    <dc:identifier>doi:10.1056/NEJMoa021967</dc:identifier>
    <dc:source>N Engl J Med, Vol. 347, No. 25. (19 December 2002), pp. 1999-2009.</dc:source>
    <dc:date>2005-12-23T03:48:00-00:00</dc:date>
    <prism:publicationYear>2002</prism:publicationYear>
    <prism:publicationName>N Engl J Med</prism:publicationName>
    <prism:issn>1533-4406</prism:issn>
    <prism:volume>347</prism:volume>
    <prism:number>25</prism:number>
    <prism:startingPage>1999</prism:startingPage>
    <prism:endingPage>2009</prism:endingPage>
    <prism:category>breastcancer</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/1090877">
    <title>Identifying gene expression changes in breast cancer that distinguish early and late relapse among uncured patients.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/1090877</link>
    <description>&lt;i&gt;Bioinformatics, Vol. 22, No. 12. (15 June 2006), pp. 1477-1485.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;MOTIVATION: In recent years, microarray technology has revealed many tumor-expressed genes prognostic of clinical outcomes in early-stage breast cancer patients. However, in the presence of cured patients, evaluating gene effect on time to relapse is quite complex since it may affect either the probability of never experiencing a relapse (cure effect) or the time to relapse among the uncured patients (disease progression effect) or both. In this context, we propose a simple and an efficient method for identifying gene expression changes that characterize early and late recurrence for uncured patients. RESULTS: Simulation results show the good performance of the proposed statistic for detecting a disease progression effect. In a study of early-stage breast cancer, our results show that the proposed statistic provides a more powerful basis for gene selection than the classical Cox model-based statistic. From a biological perspective, many of the genes identified here as associated with the speed of disease recurrence have known roles in tumorigenesis.</description>
    <dc:title>Identifying gene expression changes in breast cancer that distinguish early and late relapse among uncured patients.</dc:title>

    <dc:creator>P Broët</dc:creator>
    <dc:creator>VA Kuznetsov</dc:creator>
    <dc:creator>J Bergh</dc:creator>
    <dc:creator>ET Liu</dc:creator>
    <dc:creator>LD Miller</dc:creator>
    <dc:source>Bioinformatics, Vol. 22, No. 12. (15 June 2006), pp. 1477-1485.</dc:source>
    <dc:date>2007-02-06T16:57:34-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Bioinformatics</prism:publicationName>
    <prism:issn>1367-4803</prism:issn>
    <prism:volume>22</prism:volume>
    <prism:number>12</prism:number>
    <prism:startingPage>1477</prism:startingPage>
    <prism:endingPage>1485</prism:endingPage>
    <prism:category>breastcancer</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/927698">
    <title>PACK: Profile Analysis using Clustering and Kurtosis to find molecular classifiers in cancer.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/927698</link>
    <description>&lt;i&gt;Bioinformatics, Vol. 22, No. 18. (15 September 2006), pp. 2269-2275.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;MOTIVATION: Elucidating the molecular taxonomy of cancers and finding biological and clinical markers from microarray experiments is problematic due to the large number of variables being measured. Feature selection methods that can identify relevant classifiers or that can remove likely false positives prior to supervised analysis are therefore desirable. RESULTS: We present a novel feature selection procedure based on a mixture model and a non-gaussianity measure of a gene's expression profile. The method can be used to find genes that define either small outlier subgroups or major subdivisions, depending on the sign of kurtosis. The method can also be used as a filtering step, prior to supervised analysis, in order to reduce the false discovery rate. We validate our methodology using six independent datasets by rediscovering major classifiers in ER negative and ER positive breast cancer and in prostate cancer. Furthermore, our method finds two novel subtypes within the basal subgroup of ER negative breast tumours, associated with apoptotic and immune response functions respectively, and with statistically different clinical outcome. AVAILABILITY: An R-function pack that implements the methods used here has been added to vabayelMix, available from (www.cran.r-project.org). CONTACT: aet21@cam.ac.uk SUPPLEMENTARY INFORMATION: Supplementary information is available at Bioinformatics online.</description>
    <dc:title>PACK: Profile Analysis using Clustering and Kurtosis to find molecular classifiers in cancer.</dc:title>

    <dc:creator>AE Teschendorff</dc:creator>
    <dc:creator>A Naderi</dc:creator>
    <dc:creator>NL Barbosa-Morais</dc:creator>
    <dc:creator>C Caldas</dc:creator>
    <dc:source>Bioinformatics, Vol. 22, No. 18. (15 September 2006), pp. 2269-2275.</dc:source>
    <dc:date>2006-11-03T17:24:09-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Bioinformatics</prism:publicationName>
    <prism:issn>1460-2059</prism:issn>
    <prism:volume>22</prism:volume>
    <prism:number>18</prism:number>
    <prism:startingPage>2269</prism:startingPage>
    <prism:endingPage>2275</prism:endingPage>
    <prism:category>breastcancer</prism:category>
    <prism:category>clustering</prism:category>
    <prism:category>kurtosis</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/1133679">
    <title>A mouse stromal response to tumor invasion predicts prostate and breast cancer patient survival.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/1133679</link>
    <description>&lt;i&gt;PLoS ONE, Vol. 1 (2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Primary and metastatic tumor growth induces host tissue responses that are believed to support tumor progression. Understanding the molecular changes within the tumor microenvironment during tumor progression may therefore be relevant not only for discovering potential therapeutic targets, but also for identifying putative molecular signatures that may improve tumor classification and predict clinical outcome. To selectively address stromal gene expression changes during cancer progression, we performed cDNA microarray analysis of laser-microdissected stromal cells derived from prostate intraepithelial neoplasia (PIN) and invasive cancer in a multistage model of prostate carcinogenesis. Human orthologs of genes identified in the stromal reaction to tumor progression in this mouse model were observed to be expressed in several human cancers, and to cluster prostate and breast cancer patients into groups with statistically different clinical outcomes. Univariate Cox analysis showed that overexpression of these genes is associated with shorter survival and recurrence-free periods. Taken together, our observations provide evidence that the expression signature of the stromal response to tumor invasion in a mouse tumor model can be used to probe human cancer, and to provide a powerful prognostic indicator for some of the most frequent human malignancies.</description>
    <dc:title>A mouse stromal response to tumor invasion predicts prostate and breast cancer patient survival.</dc:title>

    <dc:creator>M Bacac</dc:creator>
    <dc:creator>P Provero</dc:creator>
    <dc:creator>N Mayran</dc:creator>
    <dc:creator>JC Stehle</dc:creator>
    <dc:creator>C Fusco</dc:creator>
    <dc:creator>I Stamenkovic</dc:creator>
    <dc:identifier>doi:10.1371/journal.pone.0000032</dc:identifier>
    <dc:source>PLoS ONE, Vol. 1 (2006)</dc:source>
    <dc:date>2007-03-01T11:56:43-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>PLoS ONE</prism:publicationName>
    <prism:issn>1932-6203</prism:issn>
    <prism:volume>1</prism:volume>
    <prism:category>breastcancer</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/1133459">
    <title>Computational exploration of the activated pathways associated with DNA damage response in breast cancer.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/1133459</link>
    <description>&lt;i&gt;Proteins, Vol. 65, No. 1. (1 October 2006), pp. 103-110.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Molecular signaling events regulate cellular activity. Cancer stimulating signals trigger cellular responses that evade the regulatory control of cell development. To understand the mechanism of signaling regulation in cancer, it is necessary to identify the activated pathways in cancer. We have developed RepairPATH, a computational algorithm that explores the activated signaling pathways in cancer. The RepairPATH integrates RepairNET, an assembled protein interaction network associated with DNA damage response, with the gene expression profiles derived from the microarray data. Based on the observation that cofunctional proteins often exhibit correlated gene expression profiles, it identifies the activated signaling pathways in cancer by systematically searching the RepairNET for proteins with significantly correlated gene expression profiles. Analyzing the gene expression profiles of breast cancer, we found distinct similarities and differences in the activated signaling pathways between the samples from the patients who developed metastases and the samples from the patients who were disease free within 5 years. The cellular pathways associated with the various DNA repair mechanisms and the cell-cycle checkpoint controls are found to be activated in both sample groups. One of the most intriguing findings is that the pathways associated with different cellular processes are functionally coordinated through BRCA1 in the disease-free sample group, whereas such functional coordination is absent in the samples from patients who developed metastases. Our analysis revealed the potential cellular pathways that regulate the signaling events in breast cancer.</description>
    <dc:title>Computational exploration of the activated pathways associated with DNA damage response in breast cancer.</dc:title>

    <dc:creator>L Wen</dc:creator>
    <dc:creator>W Li</dc:creator>
    <dc:creator>M Sobel</dc:creator>
    <dc:creator>JA Feng</dc:creator>
    <dc:identifier>doi:10.1002/prot.21064</dc:identifier>
    <dc:source>Proteins, Vol. 65, No. 1. (1 October 2006), pp. 103-110.</dc:source>
    <dc:date>2007-03-01T10:29:36-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Proteins</prism:publicationName>
    <prism:issn>1097-0134</prism:issn>
    <prism:volume>65</prism:volume>
    <prism:number>1</prism:number>
    <prism:startingPage>103</prism:startingPage>
    <prism:endingPage>110</prism:endingPage>
    <prism:category>breastcancer</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/1052952">
    <title>The molecular portraits of breast tumors are conserved across microarray platforms.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/1052952</link>
    <description>&lt;i&gt;BMC Genomics, Vol. 7 (2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND: Validation of a novel gene expression signature in independent data sets is a critical step in the development of a clinically useful test for cancer patient risk-stratification. However, validation is often unconvincing because the size of the test set is typically small. To overcome this problem we used publicly available breast cancer gene expression data sets and a novel approach to data fusion, in order to validate a new breast tumor intrinsic list. RESULTS: A 105-tumor training set containing 26 sample pairs was used to derive a new breast tumor intrinsic gene list. This intrinsic list contained 1300 genes and a proliferation signature that was not present in previous breast intrinsic gene sets. We tested this list as a survival predictor on a data set of 311 tumors compiled from three independent microarray studies that were fused into a single data set using Distance Weighted Discrimination. When the new intrinsic gene set was used to hierarchically cluster this combined test set, tumors were grouped into LumA, LumB, Basal-like, HER2+/ER-, and Normal Breast-like tumor subtypes that we demonstrated in previous datasets. These subtypes were associated with significant differences in Relapse-Free and Overall Survival. Multivariate Cox analysis of the combined test set showed that the intrinsic subtype classifications added significant prognostic information that was independent of standard clinical predictors. From the combined test set, we developed an objective and unchanging classifier based upon five intrinsic subtype mean expression profiles (i.e. centroids), which is designed for single sample predictions (SSP). The SSP approach was applied to two additional independent data sets and consistently predicted survival in both systemically treated and untreated patient groups. CONCLUSION: This study validates the &#34;breast tumor intrinsic&#34; subtype classification as an objective means of tumor classification that should be translated into a clinical assay for further retrospective and prospective validation. In addition, our method of combining existing data sets can be used to robustly validate the potential clinical value of any new gene expression profile.</description>
    <dc:title>The molecular portraits of breast tumors are conserved across microarray platforms.</dc:title>

    <dc:creator>Z Hu</dc:creator>
    <dc:creator>C Fan</dc:creator>
    <dc:creator>DS Oh</dc:creator>
    <dc:creator>JS Marron</dc:creator>
    <dc:creator>X He</dc:creator>
    <dc:creator>BF Qaqish</dc:creator>
    <dc:creator>C Livasy</dc:creator>
    <dc:creator>LA Carey</dc:creator>
    <dc:creator>E Reynolds</dc:creator>
    <dc:creator>L Dressler</dc:creator>
    <dc:creator>A Nobel</dc:creator>
    <dc:creator>J Parker</dc:creator>
    <dc:creator>MG Ewend</dc:creator>
    <dc:creator>LR Sawyer</dc:creator>
    <dc:creator>J Wu</dc:creator>
    <dc:creator>Y Liu</dc:creator>
    <dc:creator>R Nanda</dc:creator>
    <dc:creator>M Tretiakova</dc:creator>
    <dc:creator>A Ruiz Orrico</dc:creator>
    <dc:creator>D Dreher</dc:creator>
    <dc:creator>JP Palazzo</dc:creator>
    <dc:creator>L Perreard</dc:creator>
    <dc:creator>E Nelson</dc:creator>
    <dc:creator>M Mone</dc:creator>
    <dc:creator>H Hansen</dc:creator>
    <dc:creator>M Mullins</dc:creator>
    <dc:creator>JF Quackenbush</dc:creator>
    <dc:creator>MJ Ellis</dc:creator>
    <dc:creator>OI Olopade</dc:creator>
    <dc:creator>PS Bernard</dc:creator>
    <dc:creator>CM Perou</dc:creator>
    <dc:identifier>doi:10.1186/1471-2164-7-96</dc:identifier>
    <dc:source>BMC Genomics, Vol. 7 (2006)</dc:source>
    <dc:date>2007-01-19T15:13:16-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>BMC Genomics</prism:publicationName>
    <prism:issn>1471-2164</prism:issn>
    <prism:volume>7</prism:volume>
    <prism:category>breastcancer</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/591480">
    <title>Cancer classification and prediction using logistic regression with Bayesian gene selection.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/591480</link>
    <description>&lt;i&gt;J Biomed Inform, Vol. 37, No. 4. (August 2004), pp. 249-259.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;In microarray-based cancer classification and prediction, gene selection is an important research problem owing to the large number of genes and the small number of experimental conditions. In this paper, we propose a Bayesian approach to gene selection and classification using the logistic regression model. The basic idea of our approach is in conjunction with a logistic regression model to relate the gene expression with the class labels. We use Gibbs sampling and Markov chain Monte Carlo (MCMC) methods to discover important genes. To implement Gibbs Sampler and MCMC search, we derive a posterior distribution of selected genes given the observed data. After the important genes are identified, the same logistic regression model is then used for cancer classification and prediction. Issues for efficient implementation for the proposed method are discussed. The proposed method is evaluated against several large microarray data sets, including hereditary breast cancer, small round blue-cell tumors, and acute leukemia. The results show that the method can effectively identify important genes consistent with the known biological findings while the accuracy of the classification is also high. Finally, the robustness and sensitivity properties of the proposed method are also investigated.</description>
    <dc:title>Cancer classification and prediction using logistic regression with Bayesian gene selection.</dc:title>

    <dc:creator>X Zhou</dc:creator>
    <dc:creator>KY Liu</dc:creator>
    <dc:creator>ST Wong</dc:creator>
    <dc:identifier>doi:10.1016/j.jbi.2004.07.009</dc:identifier>
    <dc:source>J Biomed Inform, Vol. 37, No. 4. (August 2004), pp. 249-259.</dc:source>
    <dc:date>2006-04-19T23:42:23-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:publicationName>J Biomed Inform</prism:publicationName>
    <prism:issn>1532-0464</prism:issn>
    <prism:volume>37</prism:volume>
    <prism:number>4</prism:number>
    <prism:startingPage>249</prism:startingPage>
    <prism:endingPage>259</prism:endingPage>
    <prism:category>breastcancer</prism:category>
    <prism:category>logisticregression</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/1152294">
    <title>Prognostic meta-signature of breast cancer developed by two-stage mixture modeling of microarray data.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/1152294</link>
    <description>&lt;i&gt;BMC Genomics, Vol. 5, No. 1. (2004)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND: An increasing number of studies have profiled tumor specimens using distinct microarray platforms and analysis techniques. With the accumulating amount of microarray data, one of the most intriguing yet challenging tasks is to develop robust statistical models to integrate the findings. RESULTS: By applying a two-stage Bayesian mixture modeling strategy, we were able to assimilate and analyze four independent microarray studies to derive an inter-study validated &#34;meta-signature&#34; associated with breast cancer prognosis. Combining multiple studies (n = 305 samples) on a common probability scale, we developed a 90-gene meta-signature, which strongly associated with survival in breast cancer patients. Given the set of independent studies using different microarray platforms which included spotted cDNAs, Affymetrix GeneChip, and inkjet oligonucleotides, the individually identified classifiers yielded gene sets predictive of survival in each study cohort. The study-specific gene signatures, however, had minimal overlap with each other, and performed poorly in pairwise cross-validation. The meta-signature, on the other hand, accommodated such heterogeneity and achieved comparable or better prognostic performance when compared with the individual signatures. Further by comparing to a global standardization method, the mixture model based data transformation demonstrated superior properties for data integration and provided solid basis for building classifiers at the second stage. Functional annotation revealed that genes involved in cell cycle and signal transduction activities were over-represented in the meta-signature. CONCLUSION: The mixture modeling approach unifies disparate gene expression data on a common probability scale allowing for robust, inter-study validated prognostic signatures to be obtained. With the emerging utility of microarrays for cancer prognosis, it will be important to establish paradigms to meta-analyze disparate gene expression data for prognostic signatures of potential clinical use.</description>
    <dc:title>Prognostic meta-signature of breast cancer developed by two-stage mixture modeling of microarray data.</dc:title>

    <dc:creator>R Shen</dc:creator>
    <dc:creator>D Ghosh</dc:creator>
    <dc:creator>AM Chinnaiyan</dc:creator>
    <dc:identifier>doi:10.1186/1471-2164-5-94</dc:identifier>
    <dc:source>BMC Genomics, Vol. 5, No. 1. (2004)</dc:source>
    <dc:date>2007-03-10T01:00:37-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:publicationName>BMC Genomics</prism:publicationName>
    <prism:issn>1471-2164</prism:issn>
    <prism:volume>5</prism:volume>
    <prism:number>1</prism:number>
    <prism:category>breastcancer</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/825696">
    <title>Predicting the prognosis of breast cancer by integrating clinical and microarray data with Bayesian networks.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/825696</link>
    <description>&lt;i&gt;Bioinformatics, Vol. 22, No. 14. (15 July 2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;MOTIVATION: Clinical data, such as patient history, laboratory analysis, ultrasound parameters-which are the basis of day-to-day clinical decision support-are often underused to guide the clinical management of cancer in the presence of microarray data. We propose a strategy based on Bayesian networks to treat clinical and microarray data on an equal footing. The main advantage of this probabilistic model is that it allows to integrate these data sources in several ways and that it allows to investigate and understand the model structure and parameters. Furthermore using the concept of a Markov Blanket we can identify all the variables that shield off the class variable from the influence of the remaining network. Therefore Bayesian networks automatically perform feature selection by identifying the (in)dependency relationships with the class variable. RESULTS: We evaluated three methods for integrating clinical and microarray data: decision integration, partial integration and full integration and used them to classify publicly available data on breast cancer patients into a poor and a good prognosis group. The partial integration method is most promising and has an independent test set area under the ROC curve of 0.845. After choosing an operating point the classification performance is better than frequently used indices. CONTACT: olivier.gevaert@esat.kuleuven.be.</description>
    <dc:title>Predicting the prognosis of breast cancer by integrating clinical and microarray data with Bayesian networks.</dc:title>

    <dc:creator>O Gevaert</dc:creator>
    <dc:creator>FD Smet</dc:creator>
    <dc:creator>D Timmerman</dc:creator>
    <dc:creator>Y Moreau</dc:creator>
    <dc:creator>BD Moor</dc:creator>
    <dc:identifier>doi:10.1093/bioinformatics/btl230</dc:identifier>
    <dc:source>Bioinformatics, Vol. 22, No. 14. (15 July 2006)</dc:source>
    <dc:date>2006-09-02T10:48:52-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Bioinformatics</prism:publicationName>
    <prism:issn>1460-2059</prism:issn>
    <prism:volume>22</prism:volume>
    <prism:number>14</prism:number>
    <prism:category>bayesian</prism:category>
    <prism:category>breastcancer</prism:category>
    <prism:category>microarray</prism:category>
    <prism:category>network</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/504893">
    <title>Gene expression patterns of breast carcinomas distinguish tumor subclasses with clinical implications</title>
    <link>http://www.citeulike.org/user/macavity1g/article/504893</link>
    <description>&lt;i&gt;PNAS, Vol. 98, No. 19. (11 September 2001), pp. 10869-10874.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;The purpose of this study was to classify breast carcinomas based on variations in gene expression patterns derived from cDNA microarrays and to correlate tumor characteristics to clinical outcome. A total of 85 cDNA microarray experiments representing 78 cancers, three fibroadenomas, and four normal breast tissues were analyzed by hierarchical clustering. As reported previously, the cancers could be classified into a basal epithelial-like group, an ERBB2-overexpressing group and a normal breast-like group based on variations in gene expression. A novel finding was that the previously characterized luminal epithelial/estrogen receptor-positive group could be divided into at least two subgroups, each with a distinctive expression profile. These subtypes proved to be reasonably robust by clustering using two different gene sets: first, a set of 456 cDNA clones previously selected to reflect intrinsic properties of the tumors and, second, a gene set that highly correlated with patient outcome. Survival analyses on a subcohort of patients with locally advanced breast cancer uniformly treated in a prospective study showed significantly different outcomes for the patients belonging to the various groups, including a poor prognosis for the basal-like subtype and a significant difference in outcome for the two estrogen receptor-positive groups.</description>
    <dc:title>Gene expression patterns of breast carcinomas distinguish tumor subclasses with clinical implications</dc:title>

    <dc:creator>Therese Sorlie</dc:creator>
    <dc:creator>Charles Perou</dc:creator>
    <dc:creator>Robert Tibshirani</dc:creator>
    <dc:creator>Turid Aas</dc:creator>
    <dc:creator>Stephanie Geisler</dc:creator>
    <dc:creator>Hilde Johnsen</dc:creator>
    <dc:creator>Trevor Hastie</dc:creator>
    <dc:creator>Michael Eisen</dc:creator>
    <dc:creator>Matt van de Rijn</dc:creator>
    <dc:creator>Stefanie Jeffrey</dc:creator>
    <dc:creator>Thor Thorsen</dc:creator>
    <dc:creator>Hanne Quist</dc:creator>
    <dc:creator>John Matese</dc:creator>
    <dc:creator>Patrick Brown</dc:creator>
    <dc:creator>David Botstein</dc:creator>
    <dc:creator>Per Lonning</dc:creator>
    <dc:creator>Anne-Lise Borresen-Dale</dc:creator>
    <dc:identifier>doi:10.1073/pnas.191367098</dc:identifier>
    <dc:source>PNAS, Vol. 98, No. 19. (11 September 2001), pp. 10869-10874.</dc:source>
    <dc:date>2006-02-14T07:48:49-00:00</dc:date>
    <prism:publicationYear>2001</prism:publicationYear>
    <prism:publicationName>PNAS</prism:publicationName>
    <prism:volume>98</prism:volume>
    <prism:number>19</prism:number>
    <prism:startingPage>10869</prism:startingPage>
    <prism:endingPage>10874</prism:endingPage>
    <prism:category>breastcancer</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/1030057">
    <title>Nonparametric pathway-based regression models for analysis of genomic data.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/1030057</link>
    <description>&lt;i&gt;Biostatistics (13 June 2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;High-throughout genomic data provide an opportunity for identifying pathways and genes that are related to various clinical phenotypes. Besides these genomic data, another valuable source of data is the biological knowledge about genes and pathways that might be related to the phenotypes of many complex diseases. Databases of such knowledge are often called the metadata. In microarray data analysis, such metadata are currently explored in post hoc ways by gene set enrichment analysis but have hardly been utilized in the modeling step. We propose to develop and evaluate a pathway-based gradient descent boosting procedure for nonparametric pathways-based regression (NPR) analysis to efficiently integrate genomic data and metadata. Such NPR models consider multiple pathways simultaneously and allow complex interactions among genes within the pathways and can be applied to identify pathways and genes that are related to variations of the phenotypes. These methods also provide an alternative to mediating the problem of a large number of potential interactions by limiting analysis to biologically plausible interactions between genes in related pathways. Our simulation studies indicate that the proposed boosting procedure can indeed identify relevant pathways. Application to a gene expression data set on breast cancer distant metastasis identified that Wnt, apoptosis and cell cycle regulated pathways are more likely related to the risk of distant metastasis among lymph-node-negative breast cancer patients. Results from analysis of other two breast cancer gene expression data sets indicate that the pathways of Metalloendopeptidases (MMPs) and MMP inhibitors, as well as cell proliferation, cell growth and maintenance are important to breast cancer relapse and survival. We also observed that by incorporating the pathway information, we achieved better prediction for cancer recurrence.</description>
    <dc:title>Nonparametric pathway-based regression models for analysis of genomic data.</dc:title>

    <dc:creator>Zhi Wei</dc:creator>
    <dc:creator>Hongzhe Li</dc:creator>
    <dc:source>Biostatistics (13 June 2006)</dc:source>
    <dc:date>2007-01-08T12:08:24-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Biostatistics</prism:publicationName>
    <prism:issn>1465-4644</prism:issn>
    <prism:category>breastcancer</prism:category>
    <prism:category>microarray</prism:category>
    <prism:category>regression</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/504894">
    <title>Gene expression profiling predicts clinical outcome of breast cancer.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/504894</link>
    <description>&lt;i&gt;Nature, Vol. 415, No. 6871. (31 January 2002), pp. 530-536.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Breast cancer patients with the same stage of disease can have markedly different treatment responses and overall outcome. The strongest predictors for metastases (for example, lymph node status and histological grade) fail to classify accurately breast tumours according to their clinical behaviour. Chemotherapy or hormonal therapy reduces the risk of distant metastases by approximately one-third; however, 70-80% of patients receiving this treatment would have survived without it. None of the signatures of breast cancer gene expression reported to date allow for patient-tailored therapy strategies. Here we used DNA microarray analysis on primary breast tumours of 117 young patients, and applied supervised classification to identify a gene expression signature strongly predictive of a short interval to distant metastases ('poor prognosis' signature) in patients without tumour cells in local lymph nodes at diagnosis (lymph node negative). In addition, we established a signature that identifies tumours of BRCA1 carriers. The poor prognosis signature consists of genes regulating cell cycle, invasion, metastasis and angiogenesis. This gene expression profile will outperform all currently used clinical parameters in predicting disease outcome. Our findings provide a strategy to select patients who would benefit from adjuvant therapy.</description>
    <dc:title>Gene expression profiling predicts clinical outcome of breast cancer.</dc:title>

    <dc:creator>LJ van 't Veer</dc:creator>
    <dc:creator>H Dai</dc:creator>
    <dc:creator>MJ van de Vijver</dc:creator>
    <dc:creator>YD He</dc:creator>
    <dc:creator>AA Hart</dc:creator>
    <dc:creator>M Mao</dc:creator>
    <dc:creator>HL Peterse</dc:creator>
    <dc:creator>K van der Kooy</dc:creator>
    <dc:creator>MJ Marton</dc:creator>
    <dc:creator>AT Witteveen</dc:creator>
    <dc:creator>GJ Schreiber</dc:creator>
    <dc:creator>RM Kerkhoven</dc:creator>
    <dc:creator>C Roberts</dc:creator>
    <dc:creator>PS Linsley</dc:creator>
    <dc:creator>R Bernards</dc:creator>
    <dc:creator>SH Friend</dc:creator>
    <dc:identifier>doi:10.1038/415530a</dc:identifier>
    <dc:source>Nature, Vol. 415, No. 6871. (31 January 2002), pp. 530-536.</dc:source>
    <dc:date>2006-02-14T07:49:54-00:00</dc:date>
    <prism:publicationYear>2002</prism:publicationYear>
    <prism:publicationName>Nature</prism:publicationName>
    <prism:issn>0028-0836</prism:issn>
    <prism:volume>415</prism:volume>
    <prism:number>6871</prism:number>
    <prism:startingPage>530</prism:startingPage>
    <prism:endingPage>536</prism:endingPage>
    <prism:category>breastcancer</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/547897">
    <title>Singular value decomposition regression models for classification of tumors from microarray experiments.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/547897</link>
    <description>&lt;i&gt;Pac Symp Biocomput (2002), pp. 18-29.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;An important problem in the analysis of microarray data is correlating the high-dimensional measurements with clinical phenotypes. In this paper, we develop predictive models for associating gene expression data from microarray experiments with such outcomes. They are based on the singular value decomposition. We propose new algorithms for performing gene selection and gene clustering based on these predictive models. The estimation procedure using the regression models occurs in two stages. First, the gene expression measurements are transformed using the singular value decomposition. The regression parameters in the model linking the principal components with the clinical responses are then estimated using maximum likelihood. We demonstrate the application of the methodology to data from a breast cancer study.</description>
    <dc:title>Singular value decomposition regression models for classification of tumors from microarray experiments.</dc:title>

    <dc:creator>D Ghosh</dc:creator>
    <dc:source>Pac Symp Biocomput (2002), pp. 18-29.</dc:source>
    <dc:date>2006-03-11T14:57:30-00:00</dc:date>
    <prism:publicationYear>2002</prism:publicationYear>
    <prism:publicationName>Pac Symp Biocomput</prism:publicationName>
    <prism:startingPage>18</prism:startingPage>
    <prism:endingPage>29</prism:endingPage>
    <prism:category>breastcancer</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/1052789">
    <title>Gene expression profiling identifies molecular subtypes of inflammatory breast cancer.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/1052789</link>
    <description>&lt;i&gt;Cancer Res, Vol. 65, No. 6. (15 March 2005), pp. 2170-2178.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Breast cancer is a heterogeneous disease. Comprehensive gene expression profiles obtained using DNA microarrays have revealed previously indistinguishable subtypes of noninflammatory breast cancer (NIBC) related to different features of mammary epithelial biology and significantly associated with survival. Inflammatory breast cancer (IBC) is a rare, particular, and aggressive form of disease. Here we have investigated whether the five molecular subtypes described for NIBC (luminal A and B, basal, ERBB2 overexpressing, and normal breast-like) were also present in IBC. We monitored the RNA expression of approximately 8,000 genes in 83 breast tissue samples including 37 IBC, 44 NIBC, and 2 normal breast samples. Hierarchical clustering identified the five subtypes of breast cancer in both NIBC and IBC samples. These subtypes were highly similar to those defined in previous studies and associated with similar histoclinical features. The robustness of this classification was confirmed by the use of both alternative gene set and analysis method, and the results were corroborated at the protein level. Furthermore, we show that the differences in gene expression between NIBC and IBC and between IBC with and without pathologic complete response that we have recently reported persist in each subtype. Our results show that the expression signatures defining molecular subtypes of NIBC are also present in IBC. Obtained using different patient series and different microarray platforms, they reinforce confidence in the expression-based molecular taxonomy but also give evidence for its universality in breast cancer, independently of a specific clinical form.</description>
    <dc:title>Gene expression profiling identifies molecular subtypes of inflammatory breast cancer.</dc:title>

    <dc:creator>F Bertucci</dc:creator>
    <dc:creator>P Finetti</dc:creator>
    <dc:creator>J Rougemont</dc:creator>
    <dc:creator>E Charafe-Jauffret</dc:creator>
    <dc:creator>N Cervera</dc:creator>
    <dc:creator>C Tarpin</dc:creator>
    <dc:creator>C Nguyen</dc:creator>
    <dc:creator>L Xerri</dc:creator>
    <dc:creator>R Houlgatte</dc:creator>
    <dc:creator>J Jacquemier</dc:creator>
    <dc:creator>P Viens</dc:creator>
    <dc:creator>D Birnbaum</dc:creator>
    <dc:identifier>doi:10.1158/0008-5472.CAN-04-4115</dc:identifier>
    <dc:source>Cancer Res, Vol. 65, No. 6. (15 March 2005), pp. 2170-2178.</dc:source>
    <dc:date>2007-01-19T14:55:51-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Cancer Res</prism:publicationName>
    <prism:issn>0008-5472</prism:issn>
    <prism:volume>65</prism:volume>
    <prism:number>6</prism:number>
    <prism:startingPage>2170</prism:startingPage>
    <prism:endingPage>2178</prism:endingPage>
    <prism:category>breastcancer</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/1152288">
    <title>Gene signature evaluation as a prognostic tool: challenges in the design of the MINDACT trial.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/1152288</link>
    <description>&lt;i&gt;Nat Clin Pract Oncol, Vol. 3, No. 10. (October 2006), pp. 540-551.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;This Review describes the work conducted by the TRANSBIG consortium in the development of the MINDACT (Microarray In Node negative Disease may Avoid ChemoTherapy) trial. The goal of the trial is to provide definitive evidence regarding the clinical relevance of the 70-gene prognosis signature, and to assess the performance of this signature compared with that of traditional prognostic indicators for assigning adjuvant chemotherapy to patients with node-negative breast cancer. We outline the background work and the key questions in node-negative early-stage breast cancer, and then focus on the MINDACT trial design and statistical considerations. The challenges inherent in this trial in terms of logistics, implementation and interpretation of the results are also discussed. We hope that this article will trigger further discussion about the difficulties of setting up and analyzing trials aimed at establishing the worth of new methods for better selection of patients for cancer treatment.</description>
    <dc:title>Gene signature evaluation as a prognostic tool: challenges in the design of the MINDACT trial.</dc:title>

    <dc:creator>J Bogaerts</dc:creator>
    <dc:creator>F Cardoso</dc:creator>
    <dc:creator>M Buyse</dc:creator>
    <dc:creator>S Braga</dc:creator>
    <dc:creator>S Loi</dc:creator>
    <dc:creator>JA Harrison</dc:creator>
    <dc:creator>J Bines</dc:creator>
    <dc:creator>S Mook</dc:creator>
    <dc:creator>N Decker</dc:creator>
    <dc:creator>P Ravdin</dc:creator>
    <dc:creator>P Therasse</dc:creator>
    <dc:creator>E Rutgers</dc:creator>
    <dc:creator>LJ van 't Veer</dc:creator>
    <dc:creator>M Piccart</dc:creator>
    <dc:creator></dc:creator>
    <dc:identifier>doi:10.1038/ncponc0591</dc:identifier>
    <dc:source>Nat Clin Pract Oncol, Vol. 3, No. 10. (October 2006), pp. 540-551.</dc:source>
    <dc:date>2007-03-10T00:55:12-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Nat Clin Pract Oncol</prism:publicationName>
    <prism:issn>1743-4262</prism:issn>
    <prism:volume>3</prism:volume>
    <prism:number>10</prism:number>
    <prism:startingPage>540</prism:startingPage>
    <prism:endingPage>551</prism:endingPage>
    <prism:category>breastcancer</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/1023353">
    <title>Large scale data mining approach for gene-specific standardization of microarray gene expression data.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/1023353</link>
    <description>&lt;i&gt;Bioinformatics, Vol. 22, No. 23. (1 December 2006), pp. 2898-2904.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;MOTIVATION: The identification of the change of gene expression in multifactorial diseases, such as breast cancer is a major goal of DNA microarray experiments. Here we present a new data mining strategy to better analyze the marginal difference in gene expression between microarray samples. The idea is based on the notion that the consideration of gene's behavior in a wide variety of experiments can improve the statistical reliability on identifying genes with moderate changes between samples. RESULTS: The availability of a large collection of array samples sharing the same platform in public databases, such as NCBI GEO, enabled us to re-standardize the expression intensity of a gene using its mean and variation in the wide variety of experimental conditions. This approach was evaluated via the re-identification of breast cancer-specific gene expression. It successfully prioritized several genes associated with breast tumor, for which the expression difference between normal and breast cancer cells was marginal and thus would have been difficult to recognize using conventional analysis methods. Maximizing the utility of microarray data in the public database, it provides a valuable tool particularly for the identification of previously unrecognized disease-related genes. AVAILABILITY: A user friendly web-interface (http://compbio.sookmyung.ac.kr/~lage/) was constructed to provide the present large-scale approach for the analysis of GEO microarray data (GS-LAGE server).</description>
    <dc:title>Large scale data mining approach for gene-specific standardization of microarray gene expression data.</dc:title>

    <dc:creator>S Yoon</dc:creator>
    <dc:creator>Y Yang</dc:creator>
    <dc:creator>J Choi</dc:creator>
    <dc:creator>J Seong</dc:creator>
    <dc:source>Bioinformatics, Vol. 22, No. 23. (1 December 2006), pp. 2898-2904.</dc:source>
    <dc:date>2007-01-03T15:58:05-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Bioinformatics</prism:publicationName>
    <prism:issn>1460-2059</prism:issn>
    <prism:volume>22</prism:volume>
    <prism:number>23</prism:number>
    <prism:startingPage>2898</prism:startingPage>
    <prism:endingPage>2904</prism:endingPage>
    <prism:category>breastcancer</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/911311">
    <title>Molecular classification and molecular forecasting of breast cancer: ready for clinical application?</title>
    <link>http://www.citeulike.org/user/macavity1g/article/911311</link>
    <description>&lt;i&gt;J Clin Oncol, Vol. 23, No. 29. (10 October 2005), pp. 7350-7360.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Profiling breast cancer with expression arrays has become common, and it has been suggested that the results from early studies will lead to understanding of the molecular differences between clinical cases and allow individualization of care. We critically review two main applications of expression profiling; studies unraveling novel breast cancer classifications and those that aim to identify novel markers for prediction of clinical outcome. Breast cancer may now be subclassified into luminal, basal, and HER2 subtypes with distinct differences in prognosis and response to therapy. However, profiling studies to identify predictive markers have suffered from methodologic problems that prevent general application of their results. Future work will need to reanalyze existing microarray data sets to identify more representative sets of candidate genes for use as prognostic signatures and will need to take into account the new knowledge of molecular subtypes of breast cancer when assessing predictive effects.</description>
    <dc:title>Molecular classification and molecular forecasting of breast cancer: ready for clinical application?</dc:title>

    <dc:creator>JD Brenton</dc:creator>
    <dc:creator>LA Carey</dc:creator>
    <dc:creator>AA Ahmed</dc:creator>
    <dc:creator>C Caldas</dc:creator>
    <dc:identifier>doi:10.1200/JCO.2005.03.3845</dc:identifier>
    <dc:source>J Clin Oncol, Vol. 23, No. 29. (10 October 2005), pp. 7350-7360.</dc:source>
    <dc:date>2006-10-24T17:12:03-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>J Clin Oncol</prism:publicationName>
    <prism:issn>0732-183X</prism:issn>
    <prism:volume>23</prism:volume>
    <prism:number>29</prism:number>
    <prism:startingPage>7350</prism:startingPage>
    <prism:endingPage>7360</prism:endingPage>
    <prism:category>breastcancer</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/1075871">
    <title>Classification of human breast cancer using gene expression profiling as a component of the survival predictor algorithm.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/1075871</link>
    <description>&lt;i&gt;Clin Cancer Res, Vol. 10, No. 7. (1 April 2004), pp. 2272-2283.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;PURPOSE: Selection of treatment options with the highest likelihood of successful outcome for individual breast cancer patients is based to a large degree on accurate classification into subgroups with poor and good prognosis reflecting a different probability of disease recurrence and survival after therapy. Here we propose a breast cancer classification algorithm taking into account three main prognostic features determined at the time of diagnosis: estrogen receptor (ER) status; lymph node (LN) status; and gene expression signatures associated with distinct therapy outcome. EXPERIMENTAL DESIGN: Using microarray expression profiling and quantitative reverse transcription-PCR analyses, we compared expression profiles of the 70-gene breast cancer survival signature in established breast cancer cell lines and primary breast carcinomas from cancer patients. We classified 295 breast cancer patients using 14-, 13-, 6-, and 4-gene survival predictor signatures into subgroups having statistically distinct probability of therapy failure (P &#60; 0.0001). We evaluated the prognostic power of breast cancer survival predictor signatures alone and in combination with ER and LN status using Kaplan-Meier analysis. RESULTS: The breast cancer survival predictor algorithm allowed highly accurate classification into subgroups with dramatically distinct 5- and 10-year survival after therapy of a large cohort of 295 breast cancer patients with either ER+ or ER- tumors as well as LN+ or LN- disease (P &#60; 0.0001, log-rank test). CONCLUSIONS: Our data imply that quantitative laboratory tests measuring expression profiles of a limited set of identified small gene clusters may be useful in stratification of breast cancer patients at the time of diagnosis into subgroups with statistically distinct probability of positive outcome after therapy and assisting in selection of optimal treatment strategies. The estimated increase in survival due to the optimization of treatment protocols may reach many thousands of breast cancer survivors every year at the 10-year follow-up check point.</description>
    <dc:title>Classification of human breast cancer using gene expression profiling as a component of the survival predictor algorithm.</dc:title>

    <dc:creator>GV Glinsky</dc:creator>
    <dc:creator>T Higashiyama</dc:creator>
    <dc:creator>AB Glinskii</dc:creator>
    <dc:source>Clin Cancer Res, Vol. 10, No. 7. (1 April 2004), pp. 2272-2283.</dc:source>
    <dc:date>2007-01-30T11:41:04-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:publicationName>Clin Cancer Res</prism:publicationName>
    <prism:issn>1078-0432</prism:issn>
    <prism:volume>10</prism:volume>
    <prism:number>7</prism:number>
    <prism:startingPage>2272</prism:startingPage>
    <prism:endingPage>2283</prism:endingPage>
    <prism:category>breastcancer</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/220934">
    <title>Semantic similarity measures as tools for exploring the gene ontology.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/220934</link>
    <description>&lt;i&gt;Pac Symp Biocomput (2003), pp. 601-612.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Many bioinformatics resources hold data in the form of sequences. Often this sequence data is associated with a large amount of annotation. In many cases this data has been hard to model, and has been represented as scientific natural language, which is not readily computationally amenable. The development of the Gene Ontology provides us with a more accessible representation of some of this data. However it is not clear how this data can best be searched, or queried. Recently we have adapted information content based measures for use with the Gene Ontology (GO). In this paper we present detailed investigation of the properties of these measures, and examine various properties of GO, which may have implications for its future design.</description>
    <dc:title>Semantic similarity measures as tools for exploring the gene ontology.</dc:title>

    <dc:creator>PW Lord</dc:creator>
    <dc:creator>RD Stevens</dc:creator>
    <dc:creator>A Brass</dc:creator>
    <dc:creator>CA Goble</dc:creator>
    <dc:source>Pac Symp Biocomput (2003), pp. 601-612.</dc:source>
    <dc:date>2005-06-06T17:22:22-00:00</dc:date>
    <prism:publicationYear>2003</prism:publicationYear>
    <prism:publicationName>Pac Symp Biocomput</prism:publicationName>
    <prism:startingPage>601</prism:startingPage>
    <prism:endingPage>612</prism:endingPage>
    <prism:category>go</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/macavity1g/article/604164">
    <title>Integrated analysis of gene expression by Association Rules Discovery.</title>
    <link>http://www.citeulike.org/user/macavity1g/article/604164</link>
    <description>&lt;i&gt;BMC Bioinformatics, Vol. 7 (2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND: Microarray technology is generating huge amounts of data about the expression level of thousands of genes, or even whole genomes, across different experimental conditions. To extract biological knowledge, and to fully understand such datasets, it is essential to include external biological information about genes and gene products to the analysis of expression data. However, most of the current approaches to analyze microarray datasets are mainly focused on the analysis of experimental data, and external biological information is incorporated as a posterior process. RESULTS: In this study we present a method for the integrative analysis of microarray data based on the Association Rules Discovery data mining technique. The approach integrates gene annotations and expression data to discover intrinsic associations among both data sources based on co-occurrence patterns. We applied the proposed methodology to the analysis of gene expression datasets in which genes were annotated with metabolic pathways, transcriptional regulators and Gene Ontology categories. Automatically extracted associations revealed significant relationships among these gene attributes and expression patterns, where many of them are clearly supported by recently reported work. CONCLUSION: The integration of external biological information and gene expression data can provide insights about the biological processes associated to gene expression programs. In this paper we show that the proposed methodology is able to integrate multiple gene annotations and expression data in the same analytic framework and extract meaningful associations among heterogeneous sources of data. An implementation of the method is included in the Engene software package.</description>
    <dc:title>Integrated analysis of gene expression by Association Rules Discovery.</dc:title>

    <dc:creator>P Carmona-Saez</dc:creator>
    <dc:creator>M Chagoyen</dc:creator>
    <dc:creator>A Rodriguez</dc:creator>
    <dc:creator>O Trelles</dc:creator>