<?xml version="1.0" encoding="UTF-8"?>

<rdf:RDF
   xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
   xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#"
   xmlns="http://purl.org/rss/1.0/"
   xmlns:dc="http://purl.org/dc/elements/1.1/"
   xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/"
   xmlns:dcterms="http://purl.org/dc/terms/"

>
<channel rdf:about="http://www.citeulike.org/about">
<pubDate>Sat, 26 Jul 2008 08:00:30 BST</pubDate>


	<title>CiteULike: oannes's library [44 articles]</title>
	<description>CiteULike: oannes's library [44 articles]</description>


	<link>http://www.citeulike.org/user/oannes</link>
	<dc:publisher>CiteULike.org</dc:publisher>
	<dc:language>en-gb</dc:language>
	<dc:rights>Copyright &#169; 2004-2008 citeulike.org</dc:rights>
	<items>
    <rdf:Seq>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/361175"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/1042553"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/635272"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/703785"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/445578"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/665632"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/698680"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/698679"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/687443"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/462131"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/687433"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/663253"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/679061"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/679045"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/671671"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/670259"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/670240"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/666487"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/666486"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/666464"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/656163"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/643644"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/600396"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/345227"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/620661"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/620656"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/83540"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/484846"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/604899"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/604898"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/604897"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/604896"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/604894"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/604893"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/604892"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/604258"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/604257"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/604248"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/604247"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/233328"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/604164"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/604163"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/598491"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/oannes/article/519835"/>

	</rdf:Seq>
	</items>
	</channel>


<item rdf:about="http://www.citeulike.org/user/oannes/article/361175">
    <title>A Gentle Tutorial on the EM Algorithm and its Application to Parameter Estimation for Gaussian Mixture and Hidden Markov Models</title>
    <link>http://www.citeulike.org/user/oannes/article/361175</link>
    <description>&lt;i&gt;(1997)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We describe the maximum-likelihood parameter estimation problem and how the ExpectationMaximization (EM) algorithm can be used for its solution. We first describe the abstract form of the EM algorithm as it is often given in the literature. We then develop the EM parameter estimation procedure for two applications: 1) finding the parameters of a mixture of Gaussian densities, and 2) finding the parameters of a hidden Markov model (HMM) (i.e., the Baum-Welch algorithm) for both discrete and...</description>
    <dc:title>A Gentle Tutorial on the EM Algorithm and its Application to Parameter Estimation for Gaussian Mixture and Hidden Markov Models</dc:title>

    <dc:creator>J Bilmes</dc:creator>
    <dc:source>(1997)</dc:source>
    <dc:date>2005-10-22T03:31:57-00:00</dc:date>
    <prism:publicationYear>1997</prism:publicationYear>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/1042553">
    <title>Controlling the False Discovery Rate: A Practical and Powerful Approach to Multiple Testing</title>
    <link>http://www.citeulike.org/user/oannes/article/1042553</link>
    <description>&lt;i&gt;&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;The common approach to the multiplicity problem calls for controlling the familywise error rate (FWER). This approach, though, has faults, and we point out a few. A different approach to problems of multiple significance testing is presented. It calls for controlling the expected proportion of falsely rejected hypotheses-the false discovery rate. This error rate is equivalent to the FWER when all hypotheses are true but is smaller otherwise. Therefore, in problems where the control of the false discovery rate rather than that of the FWER is desired, there is potential for a gain in power. A simple sequential Bonferroni-type procedure is proved to control the false discovery rate for independent test statistics, and a simulation study shows that the gain in power is substantial. The use of the new procedure and the appropriateness of the criterion are illustrated with examples.</description>
    <dc:title>Controlling the False Discovery Rate: A Practical and Powerful Approach to Multiple Testing</dc:title>

    <dc:creator>Yoav Benjamini</dc:creator>
    <dc:creator>Yosef Hochberg</dc:creator>
    <dc:date>2007-01-15T14:09:52-00:00</dc:date>
    <prism:category>multiple</prism:category>
    <prism:category>test</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/635272">
    <title>Statistical modeling of biomedical corpora: mining the Caenorhabditis Genetic Center Bibliography for genes related to life span.</title>
    <link>http://www.citeulike.org/user/oannes/article/635272</link>
    <description>&lt;i&gt;BMC Bioinformatics, Vol. 7, No. 1. (8 May 2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;ABSTRACT: BACKGROUND: The statistical modeling of biomedical corpora could yield integrated, coarse-to-fine views of biological phenomena that complement discoveries made from analysis of molecular sequence and profiling data. Here, the potential of such modeling is demonstrated by examining the 5,225 free-text items in the Caenorhabditis Genetic Center (CGC) Bibliography using techniques from statistical information retrieval. Items in the CGC biomedical text corpus were modeled using the Latent Dirichlet Allocation (LDA) model. LDA is a hierarchical Bayesian model which represents a document as a random mixture over latent topics; each topic is characterized by a distribution over words. RESULTS: An LDA model estimated from CGC items had better predictive performance than two standard models (unigram and mixture of unigrams) trained using the same data. To illustrate the practical utility of LDA models of biomedical corpora, a trained CGC LDA model was used for a retrospective study of nematode genes known to be associated with life span modification. Corpus-, document-, and word-level LDA parameters were combined with terms from the Gene Ontology to enhance the explanatory value of the CGC LDA model, and to suggest additional candidates for age-related genes. A novel, pairwise document similarity measure based on the posterior distribution on the topic simplex was formulated and used to search the CGC database for &#34;homologs&#34; of a &#34;query&#34; document discussing the life span-modifying clk-2 gene. Inspection of these document homologs enabled and facilitated the production of hypotheses about the function and role of clk-2. CONCLUSIONS: Like other graphical models for genetic, genomic and other types of biological data, LDA provides a method for extracting unanticipated insights and generating predictions amenable to subsequent experimental validation.</description>
    <dc:title>Statistical modeling of biomedical corpora: mining the Caenorhabditis Genetic Center Bibliography for genes related to life span.</dc:title>

    <dc:creator>D Blei</dc:creator>
    <dc:creator>K Franks</dc:creator>
    <dc:creator>M Jordan</dc:creator>
    <dc:creator>I Mian</dc:creator>
    <dc:identifier>doi:10.1186/1471-2105-7-250</dc:identifier>
    <dc:source>BMC Bioinformatics, Vol. 7, No. 1. (8 May 2006)</dc:source>
    <dc:date>2006-05-15T07:28:54-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>BMC Bioinformatics</prism:publicationName>
    <prism:issn>1471-2105</prism:issn>
    <prism:volume>7</prism:volume>
    <prism:number>1</prism:number>
    <prism:category>latent_semantic_analysis</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/703785">
    <title>Identifying biological concepts from a protein-related corpus with a probabilistic topic model.</title>
    <link>http://www.citeulike.org/user/oannes/article/703785</link>
    <description>&lt;i&gt;BMC Bioinformatics, Vol. 7 (2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND: Biomedical literature, e.g., MEDLINE, contains a wealth of knowledge regarding functions of proteins. Major recurring biological concepts within such text corpora represent the domains of this body of knowledge. The goal of this research is to identify the major biological topics/concepts from a corpus of protein-related MEDLINE titles and abstracts by applying a probabilistic topic model. RESULTS: The latent Dirichlet allocation (LDA) model was applied to the corpus. Based on the Bayesian model selection, 300 major topics were extracted from the corpus. The majority of identified topics/concepts was found to be semantically coherent and most represented biological objects or concepts. The identified topics/concepts were further mapped to the controlled vocabulary of the Gene Ontology (GO) terms based on mutual information. CONCLUSION: The major and recurring biological concepts within a collection of MEDLINE documents can be extracted by the LDA model. The identified topics/concepts provide parsimonious and semantically-enriched representation of the texts in a semantic space with reduced dimensionality and can be used to index text.</description>
    <dc:title>Identifying biological concepts from a protein-related corpus with a probabilistic topic model.</dc:title>

    <dc:creator>B Zheng</dc:creator>
    <dc:creator>DC McLean</dc:creator>
    <dc:creator>X Lu</dc:creator>
    <dc:identifier>doi:10.1186/1471-2105-7-58</dc:identifier>
    <dc:source>BMC Bioinformatics, Vol. 7 (2006)</dc:source>
    <dc:date>2006-06-20T21:22:40-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>BMC Bioinformatics</prism:publicationName>
    <prism:issn>1471-2105</prism:issn>
    <prism:volume>7</prism:volume>
    <prism:category>latent_semantic_analysis</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/445578">
    <title>Finding genomic ontology terms in text using evidence content.</title>
    <link>http://www.citeulike.org/user/oannes/article/445578</link>
    <description>&lt;i&gt;BMC Bioinformatics, Vol. 6 Suppl 1 (2005)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND: The development of text mining systems that annotate biological entities with their properties using scientific literature is an important recent research topic. These systems need first to recognize the biological entities and properties in the text, and then decide which pairs represent valid annotations. METHODS: This document introduces a novel unsupervised method for recognizing biological properties in unstructured text, involving the evidence content of their names. RESULTS: This document shows the results obtained by the application of our method to BioCreative tasks 2.1 and 2.2, where it identified Gene Ontology annotations and their evidence in a set of articles. CONCLUSION: From the performance obtained in BioCreative, we concluded that an automatic annotation system can effectively use our method to identify biological properties in unstructured text.</description>
    <dc:title>Finding genomic ontology terms in text using evidence content.</dc:title>

    <dc:creator>FM Couto</dc:creator>
    <dc:creator>MJ Silva</dc:creator>
    <dc:creator>PM Coutinho</dc:creator>
    <dc:identifier>doi:10.1186/1471-2105-6-S1-S21</dc:identifier>
    <dc:source>BMC Bioinformatics, Vol. 6 Suppl 1 (2005)</dc:source>
    <dc:date>2005-12-20T16:34:59-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>BMC Bioinformatics</prism:publicationName>
    <prism:issn>1471-2105</prism:issn>
    <prism:volume>6 Suppl 1</prism:volume>
    <prism:category>feature</prism:category>
    <prism:category>nlp-reading</prism:category>
    <prism:category>semantic</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/665632">
    <title>Automatically annotating documents with normalized gene lists.</title>
    <link>http://www.citeulike.org/user/oannes/article/665632</link>
    <description>&lt;i&gt;BMC Bioinformatics, Vol. 6 Suppl 1 (2005)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND: Document gene normalization is the problem of creating a list of unique identifiers for genes that are mentioned within a document. Automating this process has many potential applications in both information extraction and database curation systems. Here we present two separate solutions to this problem. The first is primarily based on standard pattern matching and information extraction techniques. The second and more novel solution uses a statistical classifier to recognize valid gene matches from a list of known gene synonyms. RESULTS: We compare the results of the two systems, analyze their merits and argue that the classification based system is preferable for many reasons including performance, simplicity and robustness. Our best systems attain a balanced precision and recall in the range of 74%-92%, depending on the organism.</description>
    <dc:title>Automatically annotating documents with normalized gene lists.</dc:title>

    <dc:creator>J Crim</dc:creator>
    <dc:creator>R McDonald</dc:creator>
    <dc:creator>F Pereira</dc:creator>
    <dc:identifier>doi:10.1186/1471-2105-6-S1-S13</dc:identifier>
    <dc:source>BMC Bioinformatics, Vol. 6 Suppl 1 (2005)</dc:source>
    <dc:date>2006-05-22T15:27:54-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>BMC Bioinformatics</prism:publicationName>
    <prism:issn>1471-2105</prism:issn>
    <prism:volume>6 Suppl 1</prism:volume>
    <prism:category>feature</prism:category>
    <prism:category>nlp-reading</prism:category>
    <prism:category>semantic</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/698680">
    <title>Finding scientific topics.</title>
    <link>http://www.citeulike.org/user/oannes/article/698680</link>
    <description>&lt;i&gt;Proc Natl Acad Sci U S A, Vol. 101 Suppl 1 (6 April 2004), pp. 5228-5235.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;A first step in identifying the content of a document is determining which topics that document addresses. We describe a generative model for documents, introduced by Blei, Ng, and Jordan [Blei, D. M., Ng, A. Y. &#38; Jordan, M. I. (2003) J. Machine Learn. Res. 3, 993-1022], in which each document is generated by choosing a distribution over topics and then choosing each word in the document from a topic selected according to this distribution. We then present a Markov chain Monte Carlo algorithm for inference in this model. We use this algorithm to analyze abstracts from PNAS by using Bayesian model selection to establish the number of topics. We show that the extracted topics capture meaningful structure in the data, consistent with the class designations provided by the authors of the articles, and outline further applications of this analysis, including identifying &#34;hot topics&#34; by examining temporal dynamics and tagging abstracts to illustrate semantic content.</description>
    <dc:title>Finding scientific topics.</dc:title>

    <dc:creator>TL Griffiths</dc:creator>
    <dc:creator>M Steyvers</dc:creator>
    <dc:identifier>doi:10.1073/pnas.0307752101</dc:identifier>
    <dc:source>Proc Natl Acad Sci U S A, Vol. 101 Suppl 1 (6 April 2004), pp. 5228-5235.</dc:source>
    <dc:date>2006-06-16T19:50:07-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:publicationName>Proc Natl Acad Sci U S A</prism:publicationName>
    <prism:issn>0027-8424</prism:issn>
    <prism:volume>101 Suppl 1</prism:volume>
    <prism:startingPage>5228</prism:startingPage>
    <prism:endingPage>5235</prism:endingPage>
    <prism:category>latent_semantic_analysis</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/698679">
    <title>Mixed-membership models of scientific publications.</title>
    <link>http://www.citeulike.org/user/oannes/article/698679</link>
    <description>&lt;i&gt;Proc Natl Acad Sci U S A, Vol. 101 Suppl 1 (6 April 2004), pp. 5220-5227.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;PNAS is one of world's most cited multidisciplinary scientific journals. The PNAS official classification structure of subjects is reflected in topic labels submitted by the authors of articles, largely related to traditionally established disciplines. These include broad field classifications into physical sciences, biological sciences, social sciences, and further subtopic classifications within the fields. Focusing on biological sciences, we explore an internal soft-classification structure of articles based only on semantic decompositions of abstracts and bibliographies and compare it with the formal discipline classifications. Our model assumes that there is a fixed number of internal categories, each characterized by multinomial distributions over words (in abstracts) and references (in bibliographies). Soft classification for each article is based on proportions of the article's content coming from each category. We discuss the appropriateness of the model for the PNAS database as well as other features of the data relevant to soft classification.</description>
    <dc:title>Mixed-membership models of scientific publications.</dc:title>

    <dc:creator>E Erosheva</dc:creator>
    <dc:creator>S Fienberg</dc:creator>
    <dc:creator>J Lafferty</dc:creator>
    <dc:identifier>doi:10.1073/pnas.0307760101</dc:identifier>
    <dc:source>Proc Natl Acad Sci U S A, Vol. 101 Suppl 1 (6 April 2004), pp. 5220-5227.</dc:source>
    <dc:date>2006-06-16T19:49:08-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:publicationName>Proc Natl Acad Sci U S A</prism:publicationName>
    <prism:issn>0027-8424</prism:issn>
    <prism:volume>101 Suppl 1</prism:volume>
    <prism:startingPage>5220</prism:startingPage>
    <prism:endingPage>5227</prism:endingPage>
    <prism:category>latent_semantic_analysis</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/687443">
    <title>ITTACA: a new database for integrated tumor transcriptome array and clinical data analysis.</title>
    <link>http://www.citeulike.org/user/oannes/article/687443</link>
    <description>&lt;i&gt;Nucleic Acids Res, Vol. 34, No. Database issue. (1 January 2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Transcriptome microarrays have become one of the tools of choice for investigating the genes involved in tumorigenesis and tumor progression, as well as finding new biomarkers and gene expression signatures for the diagnosis and prognosis of cancer. Here, we describe a new database for Integrated Tumor Transcriptome Array and Clinical data Analysis (ITTACA). ITTACA centralizes public datasets containing both gene expression and clinical data. ITTACA currently focuses on the types of cancer that are of particular interest to research teams at Institut Curie: breast carcinoma, bladder carcinoma and uveal melanoma. A web interface allows users to carry out different class comparison analyses, including the comparison of expression distribution profiles, tests for differential expression and patient survival analyses. ITTACA is complementary to other databases, such as GEO and SMD, because it offers a better integration of clinical data and different functionalities. It also offers more options for class comparison analyses when compared with similar projects such as Oncomine. For example, users can define their own patient groups according to clinical data or gene expression levels. This added flexibility and the user-friendly web interface makes ITTACA especially useful for comparing personal results with the results in the existing literature. ITTACA is accessible online at http://bioinfo.curie.fr/ittaca.</description>
    <dc:title>ITTACA: a new database for integrated tumor transcriptome array and clinical data analysis.</dc:title>

    <dc:creator>A Elfilali</dc:creator>
    <dc:creator>S Lair</dc:creator>
    <dc:creator>C Verbeke</dc:creator>
    <dc:creator>P La Rosa</dc:creator>
    <dc:creator>F Radvanyi</dc:creator>
    <dc:creator>E Barillot</dc:creator>
    <dc:source>Nucleic Acids Res, Vol. 34, No. Database issue. (1 January 2006)</dc:source>
    <dc:date>2006-06-06T20:04:40-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Nucleic Acids Res</prism:publicationName>
    <prism:issn>1362-4962</prism:issn>
    <prism:volume>34</prism:volume>
    <prism:number>Database issue</prism:number>
    <prism:category>cancer</prism:category>
    <prism:category>disease</prism:category>
    <prism:category>nar</prism:category>
    <prism:category>regulomics</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/462131">
    <title>Interplay between VHL/HIF1α and Wnt/β-catenin pathways during colorectal tumorigenesis</title>
    <link>http://www.citeulike.org/user/oannes/article/462131</link>
    <description>&lt;i&gt;Oncogene, Vol. aop, No. current.&lt;/i&gt;</description>
    <dc:title>Interplay between VHL/HIF1α and Wnt/β-catenin pathways during colorectal tumorigenesis</dc:title>

    <dc:creator>RH Giles</dc:creator>
    <dc:creator>MP Lolkema</dc:creator>
    <dc:creator>CM Snijckers</dc:creator>
    <dc:creator>M Belderbos</dc:creator>
    <dc:creator>P van der Groep</dc:creator>
    <dc:creator>DA Mans</dc:creator>
    <dc:creator>M van Beest</dc:creator>
    <dc:creator>M van Noort</dc:creator>
    <dc:creator>R Goldschmeding</dc:creator>
    <dc:creator>PJ van Diest</dc:creator>
    <dc:creator>H Clevers</dc:creator>
    <dc:creator>EE Voest</dc:creator>
    <dc:identifier>doi:10.1038/sj.onc.1209330</dc:identifier>
    <dc:source>Oncogene, Vol. aop, No. current.</dc:source>
    <dc:date>2006-01-11T15:55:34-00:00</dc:date>
    <prism:publicationName>Oncogene</prism:publicationName>
    <prism:issn>0950-9232</prism:issn>
    <prism:volume>aop</prism:volume>
    <prism:number>current</prism:number>
    <prism:publisher>Nature Publishing Group</prism:publisher>
    <prism:category>disease</prism:category>
    <prism:category>vhl</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/687433">
    <title>Inactivation of von Hippel-Lindau Gene Induces Constitutive Phosphorylation of MET Protein in Clear Cell Renal Carcinoma</title>
    <link>http://www.citeulike.org/user/oannes/article/687433</link>
    <description>&lt;i&gt;Cancer Res, Vol. 66, No. 7. (1 April 2006), pp. 3699-3705.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;It is well known that inactivation of von Hippel-Lindau (VHL) gene predisposes for human clear cell renal carcinoma (CCRC). However, details about critical roles of VHL inactivation during tumorigenesis are still unknown. MET protein is a tyrosine kinase receptor for hepatocyte growth factor/scatter factor (HGF/SF), which regulates cell growth, cell morphology, and cell motility. We showed that MET protein overexpressed in CCRC cells was phosphorylated without HGF/SF. This constitutive phosphorylation of MET protein in CCRC cells was inhibited by the rescue of exogenous wild-type VHL gene without a decrease in expression level of MET protein. Interestingly, wild-type VHL gene suppressed the phosphorylation of MET protein only under high cell density conditions. Additionally, MET protein activated by the inactivation of VHL gene modified cell adherence, including N-cadherin and beta-catenin. When activation of MET protein in CCRC cells was inhibited by the MET inhibitor K252a, the growth of CCRC cells in vitro and the tumorigenesis induced by CCRC cells in nude mice were suppressed. From these results, we concluded that inactivation of VHL gene induced constitutive phosphorylation of MET protein and modified intercellular adherence structure to trigger the cell growth released from contact inhibition, finally resulting in tumorigenesis. This is one of the mechanisms of CCRC oncogenesis, and MET protein has potential as a molecular target for novel CCRC therapies. (Cancer Res 2006; 66(7): 3699-705) 10.1158/0008-5472.CAN-05-0617</description>
    <dc:title>Inactivation of von Hippel-Lindau Gene Induces Constitutive Phosphorylation of MET Protein in Clear Cell Renal Carcinoma</dc:title>

    <dc:creator>Noboru Nakaigawa</dc:creator>
    <dc:creator>Masahiro Yao</dc:creator>
    <dc:creator>Masaya Baba</dc:creator>
    <dc:creator>Shingo Kato</dc:creator>
    <dc:creator>Takeshi Kishida</dc:creator>
    <dc:creator>Keiko Hattori</dc:creator>
    <dc:creator>Yoji Nagashima</dc:creator>
    <dc:creator>Yoshinobu Kubota</dc:creator>
    <dc:source>Cancer Res, Vol. 66, No. 7. (1 April 2006), pp. 3699-3705.</dc:source>
    <dc:date>2006-06-06T19:20:12-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Cancer Res</prism:publicationName>
    <prism:volume>66</prism:volume>
    <prism:number>7</prism:number>
    <prism:startingPage>3699</prism:startingPage>
    <prism:endingPage>3705</prism:endingPage>
    <prism:category>disease</prism:category>
    <prism:category>vhl</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/663253">
    <title>The transcriptional regulatory code of eukaryotic cells - insights from genome-wide analysis of chromatin organization and transcription factor binding</title>
    <link>http://www.citeulike.org/user/oannes/article/663253</link>
    <description>&lt;i&gt;Current Opinion in Cell Biology, Vol. 18, No. 3. (June 2006), pp. 291-298.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Control of eukaryotic gene expression involves combinatorial interactions between transcription factors and regulatory sequences in the genome. In addition, chromatin structure and modification states play key roles in determining the competence of transcription. The term 'transcriptional regulatory code' has been used to describe the interplay of these events in the complex control of transcription. With the maturation of methods for detecting in vivo protein-DNA interactions on a genome-wide scale, detailed maps of chromatin features and transcription factor localization over entire genomes of eukaryotic cells are enriching our understanding of the properties and nature of this transcriptional regulatory code. The rapidly growing number of maps has revealed the dynamic nature of nucleosome composition and chromatin remodeling at regulatory regions and highlighted some unexpected properties of transcriptional regulatory networks in eukaryotic cells.</description>
    <dc:title>The transcriptional regulatory code of eukaryotic cells - insights from genome-wide analysis of chromatin organization and transcription factor binding</dc:title>

    <dc:creator>Leah Barrera</dc:creator>
    <dc:creator>Bing Ren</dc:creator>
    <dc:identifier>doi:10.1016/j.ceb.2006.04.002</dc:identifier>
    <dc:source>Current Opinion in Cell Biology, Vol. 18, No. 3. (June 2006), pp. 291-298.</dc:source>
    <dc:date>2006-05-21T10:55:49-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Current Opinion in Cell Biology</prism:publicationName>
    <prism:volume>18</prism:volume>
    <prism:number>3</prism:number>
    <prism:startingPage>291</prism:startingPage>
    <prism:endingPage>298</prism:endingPage>
    <prism:category>chromatin</prism:category>
    <prism:category>tfbs</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/679061">
    <title>Composite Module Analyst: a fitness-based tool for identification of transcription factor binding site combinations.</title>
    <link>http://www.citeulike.org/user/oannes/article/679061</link>
    <description>&lt;i&gt;Bioinformatics, Vol. 22, No. 10. (15 May 2006), pp. 1190-1197.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;MOTIVATION: Functionally related genes involved in the same molecular-genetic, biochemical or physiological process are often regulated coordinately. Such regulation is provided by precisely organized binding of a multiplicity of special proteins [transcription factors (TFs)] to their target sites (cis-elements) in regulatory regions of genes. Cis-element combinations provide a structural basis for the generation of unique patterns of gene expression. RESULTS: Here we present a new approach for defining promoter models based on the composition of TF binding sites and their pairs. We utilize a multicomponent fitness function for selection of the promoter model that fits best to the observed gene expression profile. We demonstrate examples of successful application of the fitness function with the help of a genetic algorithm for the analysis of functionally related or co-expressed genes as well as testing on simulated and permutated data. AVAILABILITY: The CMA program is freely available for non-commercial users. URL http://www.gene-regulation.com/pub/programs.html#CMAnalyst. It is also a part of the commercial system ExPlaintrade mark (www.biobase.de) designed for causal analysis of gene expression data. CONTACT: alexander.kel@biobase-international.com.</description>
    <dc:title>Composite Module Analyst: a fitness-based tool for identification of transcription factor binding site combinations.</dc:title>

    <dc:creator>A Kel</dc:creator>
    <dc:creator>T Konovalova</dc:creator>
    <dc:creator>T Waleev</dc:creator>
    <dc:creator>E Cheremushkin</dc:creator>
    <dc:creator>O Kel-Margoulis</dc:creator>
    <dc:creator>E Wingender</dc:creator>
    <dc:source>Bioinformatics, Vol. 22, No. 10. (15 May 2006), pp. 1190-1197.</dc:source>
    <dc:date>2006-06-01T02:18:32-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Bioinformatics</prism:publicationName>
    <prism:issn>1367-4803</prism:issn>
    <prism:volume>22</prism:volume>
    <prism:number>10</prism:number>
    <prism:startingPage>1190</prism:startingPage>
    <prism:endingPage>1197</prism:endingPage>
    <prism:category>crm</prism:category>
    <prism:category>tfbs</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/679045">
    <title>Human Transcription Factors Contain a High Fraction of Intrinsically Disordered Regions Essential for Transcriptional Regulation.</title>
    <link>http://www.citeulike.org/user/oannes/article/679045</link>
    <description>&lt;i&gt;J Mol Biol (25 April 2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Human transcriptional regulation factors, such as activators, repressors, and enhancer-binding factors are quite different from their prokaryotic counterparts in two respects: the average sequence in human is more than twice as long as that in prokaryotes, while the fraction of sequence aligned to domains of known structure is 31% in human transcription factors (TFs), less than half of that in bacterial TFs (72%). Intrinsically disordered (ID) regions were identified by a disorder-prediction program, and were found to be in good agreement with available experimental data. Analysis of 401 human TFs with experimental evidence from the Swiss-Prot database showed that as high as 49% of the entire sequence of human TFs is occupied by ID regions. More than half of the human TFs consist of a small DNA binding domain (DBD) and long ID regions frequently sandwiching unassigned regions. The remaining TFs have structural domains in addition to DBDs and ID regions. Experimental studies, particularly those with NMR, revealed that the transactivation domains in unbound TFs are usually unstructured, but become structured upon binding to their partners. The sequences of human and mouse TF orthologues are 90.5% identical despite a high incidence of ID regions, probably reflecting important functional roles played by ID regions. In general ID regions occupy a high fraction in TFs of eukaryotes, but not in prokaryotes. Implications of this dichotomy are discussed in connection with their functional roles in transcriptional regulation and evolution.</description>
    <dc:title>Human Transcription Factors Contain a High Fraction of Intrinsically Disordered Regions Essential for Transcriptional Regulation.</dc:title>

    <dc:creator>Yoshiaki Minezaki</dc:creator>
    <dc:creator>Keiichi Homma</dc:creator>
    <dc:creator>Akira R Kinjo</dc:creator>
    <dc:creator>Ken Nishikawa</dc:creator>
    <dc:identifier>doi:10.1016/j.jmb.2006.04.016</dc:identifier>
    <dc:source>J Mol Biol (25 April 2006)</dc:source>
    <dc:date>2006-06-01T02:12:22-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>J Mol Biol</prism:publicationName>
    <prism:issn>0022-2836</prism:issn>
    <prism:category>structure</prism:category>
    <prism:category>tfbs</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/671671">
    <title>BioMed Central | Abstract | 1471-2105-7-229 | Meta-analysis discovery of tissue-specific DNA sequence motifs from mammalian gene expression data</title>
    <link>http://www.citeulike.org/user/oannes/article/671671</link>
    <description>&lt;i&gt;&lt;/i&gt;</description>
    <dc:title>BioMed Central | Abstract | 1471-2105-7-229 | Meta-analysis discovery of tissue-specific DNA sequence motifs from mammalian gene expression data</dc:title>

    <dc:date>2006-05-26T20:47:37-00:00</dc:date>
    <prism:category>crm</prism:category>
    <prism:category>tfbs</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/670259">
    <title>Transcription in four dimensions: nuclear receptor-directed initiation of gene expression.</title>
    <link>http://www.citeulike.org/user/oannes/article/670259</link>
    <description>&lt;i&gt;EMBO Rep, Vol. 7, No. 2. (February 2006), pp. 161-167.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Regulated gene expression, achieved through the coordinated assembly of transcription factors, co-regulators and the basal transcription machinery on promoters, is an initial step in accomplishing cell specificity and homeostasis. Traditional models of transcriptional regulation tend to be static, although gene expression profiles change with time to adapt to developmental and environmental cues. Furthermore, biochemical and structural studies have determined that initiation of transcription progresses through a series of ordered events. By integrating time into the analysis of transcription, chromatin immunoprecipitation assays and live-cell imaging techniques have revealed the dynamic, cooperative, functionally redundant and cyclical nature of gene expression. In this review, we present a dynamic model of gene transcription that integrates data obtained by these two techniques.</description>
    <dc:title>Transcription in four dimensions: nuclear receptor-directed initiation of gene expression.</dc:title>

    <dc:creator>R Métivier</dc:creator>
    <dc:creator>G Reid</dc:creator>
    <dc:creator>F Gannon</dc:creator>
    <dc:identifier>doi:10.1038/sj.embor.7400626</dc:identifier>
    <dc:source>EMBO Rep, Vol. 7, No. 2. (February 2006), pp. 161-167.</dc:source>
    <dc:date>2006-05-25T16:26:07-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>EMBO Rep</prism:publicationName>
    <prism:issn>1469-221X</prism:issn>
    <prism:volume>7</prism:volume>
    <prism:number>2</prism:number>
    <prism:startingPage>161</prism:startingPage>
    <prism:endingPage>167</prism:endingPage>
    <prism:category>dynamic</prism:category>
    <prism:category>tfbs</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/670240">
    <title>SUMO and ubiquitin in the nucleus: different functions, similar mechanisms?</title>
    <link>http://www.citeulike.org/user/oannes/article/670240</link>
    <description>&lt;i&gt;Genes Dev., Vol. 18, No. 17. (1 September 2004), pp. 2046-2059.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;The small ubiquitin-related modifier SUMO posttranslationally modifies many proteins with roles in diverse processes including regulation of transcription, chromatin structure, and DNA repair. Similar to nonproteolytic roles of ubiquitin, SUMO modification regulates protein localization and activity. Some proteins can be modified by SUMO and ubiquitin, but with distinct functional consequences. It is possible that the effects of ubiquitination and SUMOylation are both largely due to binding of proteins bearing specific interaction domains. Both modifications are reversible, and in some cases dynamic cycles of modification may be required for activity. Studies of SUMO and ubiquitin in the nucleus are yielding new insights into regulation of gene expression, genome maintenance, and signal transduction. 10.1101/gad.1214604</description>
    <dc:title>SUMO and ubiquitin in the nucleus: different functions, similar mechanisms?</dc:title>

    <dc:creator>Grace Gill</dc:creator>
    <dc:identifier>doi:10.1101/gad.1214604</dc:identifier>
    <dc:source>Genes Dev., Vol. 18, No. 17. (1 September 2004), pp. 2046-2059.</dc:source>
    <dc:date>2006-05-25T16:12:34-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:publicationName>Genes Dev.</prism:publicationName>
    <prism:volume>18</prism:volume>
    <prism:number>17</prism:number>
    <prism:startingPage>2046</prism:startingPage>
    <prism:endingPage>2059</prism:endingPage>
    <prism:category>sumo</prism:category>
    <prism:category>tfbs</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/666487">
    <title>Contrasting effects on HIF-1alpha regulation by disease-causing pVHL mutations correlate with patterns of tumourigenesis in von Hippel-Lindau disease.</title>
    <link>http://www.citeulike.org/user/oannes/article/666487</link>
    <description>&lt;i&gt;Hum Mol Genet, Vol. 10, No. 10. (1 May 2001), pp. 1029-1038.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;The von Hippel-Lindau tumour suppressor gene product (pVHL) associates with the elongin B and C and Cul2 proteins to form a ubiquitin-ligase complex (VCBC). To date, the only VCBC substrates identified are the hypoxia-inducible factor alpha subunits (HIF-1alpha and HIF-2alpha). However, pVHL is thought to have multiple functions and the significance of HIF-1alpha and HIF-2alpha regulation for tumour suppressor activity has not been defined. VHL disease is characterized by distinct clinical subtypes. Thus haemangioblastomas (HABs) and renal cell carcinoma (RCC) but not phaeochromocytoma (PHE) occur in type 1 VHL disease. Type 2 subtypes are characterized by PHE susceptibility but differ with respect to additional tumours (type 2A, PHE+HAB but not RCC; type 2B, PHE+ HAB+RCC; type 2C, PHE only). We investigated in detail the effect of 13 naturally occurring VHL mutations (11 missense), representing each phenotypic subclass, on HIF-alpha subunit regulation. Consistent effects on pVHL function were observed for all mutations within each subclass. Mutations associated with the PHE-only phenotype (type 2C) promoted HIF-alpha ubiquitylation in vitro and demonstrated wild-type binding patterns with pVHL interacting proteins, suggesting that loss of other pVHL functions are necessary for PHE susceptibility. Mutations causing HAB susceptibility (types 1, 2A and 2B) demonstrated variable effects on HIF-alpha subunit and elongin binding, but all resulted in defective HIF-alpha regulation and loss of p220 (fibronectin) binding. All RCC-associated mutations caused complete HIF-alpha dysregulation and loss of p220 (fibronectin) binding. Our findings are consistent with impaired ability to degrade HIF-alpha subunit being required for HAB development and RCC susceptibility.</description>
    <dc:title>Contrasting effects on HIF-1alpha regulation by disease-causing pVHL mutations correlate with patterns of tumourigenesis in von Hippel-Lindau disease.</dc:title>

    <dc:creator>SC Clifford</dc:creator>
    <dc:creator>ME Cockman</dc:creator>
    <dc:creator>AC Smallwood</dc:creator>
    <dc:creator>DR Mole</dc:creator>
    <dc:creator>ER Woodward</dc:creator>
    <dc:creator>PH Maxwell</dc:creator>
    <dc:creator>PJ Ratcliffe</dc:creator>
    <dc:creator>ER Maher</dc:creator>
    <dc:source>Hum Mol Genet, Vol. 10, No. 10. (1 May 2001), pp. 1029-1038.</dc:source>
    <dc:date>2006-05-23T19:34:46-00:00</dc:date>
    <prism:publicationYear>2001</prism:publicationYear>
    <prism:publicationName>Hum Mol Genet</prism:publicationName>
    <prism:issn>0964-6906</prism:issn>
    <prism:volume>10</prism:volume>
    <prism:number>10</prism:number>
    <prism:startingPage>1029</prism:startingPage>
    <prism:endingPage>1038</prism:endingPage>
    <prism:category>disease</prism:category>
    <prism:category>vhl</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/666486">
    <title>p53 Stabilization and Transactivation by a von Hippel-Lindau Protein.</title>
    <link>http://www.citeulike.org/user/oannes/article/666486</link>
    <description>&lt;i&gt;Mol Cell, Vol. 22, No. 3. (5 May 2006), pp. 395-405.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;von Hippel-Lindau (VHL) disease is a rare autosomal dominant cancer syndrome. Although hypoxia-inducible factor-alpha (HIFalpha) is a well-documented substrate of von Hippel-Lindau tumor suppressor protein (pVHL), it remains unclear whether the dysregulation of HIF is sufficient to account for de novo tumorigenesis in VHL-deleted cells. Here we found that pVHL directly associates with and stabilizes p53 by suppressing Mdm2-mediated ubiquitination and nuclear export of p53. Moreover, upon genotoxic stress, pVHL invoked an interaction between p53 and p300 and the acetylation of p53, which ultimately led to an increase in p53 transcriptional activity and p53-mediated cell cycle arrest and apoptosis. These results suggest that the tumor suppressor pVHL has an unexpected function to upregulate the tumor suppressor p53.</description>
    <dc:title>p53 Stabilization and Transactivation by a von Hippel-Lindau Protein.</dc:title>

    <dc:creator>JS Roe</dc:creator>
    <dc:creator>H Kim</dc:creator>
    <dc:creator>SM Lee</dc:creator>
    <dc:creator>ST Kim</dc:creator>
    <dc:creator>EJ Cho</dc:creator>
    <dc:creator>HD Youn</dc:creator>
    <dc:identifier>doi:10.1016/j.molcel.2006.04.006</dc:identifier>
    <dc:source>Mol Cell, Vol. 22, No. 3. (5 May 2006), pp. 395-405.</dc:source>
    <dc:date>2006-05-23T19:31:11-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Mol Cell</prism:publicationName>
    <prism:issn>1097-2765</prism:issn>
    <prism:volume>22</prism:volume>
    <prism:number>3</prism:number>
    <prism:startingPage>395</prism:startingPage>
    <prism:endingPage>405</prism:endingPage>
    <prism:category>disease</prism:category>
    <prism:category>vhl</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/666464">
    <title>Hypoxia-inducible factors: where, when and why?</title>
    <link>http://www.citeulike.org/user/oannes/article/666464</link>
    <description>&lt;i&gt;Vol. 69, No. 1. (0000), pp. 15-17.&lt;/i&gt;</description>
    <dc:title>Hypoxia-inducible factors: where, when and why?</dc:title>

    <dc:creator>JM Gleadle</dc:creator>
    <dc:creator>DR Mole</dc:creator>
    <dc:creator>CW Pugh</dc:creator>
    <dc:identifier>doi:10.1038/sj.ki.5000072</dc:identifier>
    <dc:source>Vol. 69, No. 1. (0000), pp. 15-17.</dc:source>
    <dc:date>2006-05-23T19:14:29-00:00</dc:date>
    <prism:publicationYear>0000</prism:publicationYear>
    <prism:volume>69</prism:volume>
    <prism:number>1</prism:number>
    <prism:startingPage>15</prism:startingPage>
    <prism:endingPage>17</prism:endingPage>
    <prism:category>disease</prism:category>
    <prism:category>vhl</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/656163">
    <title>Activation of TRAP/Mediator Subunit TRAP220/Med1 Is Regulated by Mitogen-Activated Protein Kinase-Dependent Phosphorylation</title>
    <link>http://www.citeulike.org/user/oannes/article/656163</link>
    <description>&lt;i&gt;Mol. Cell. Biol., Vol. 25, No. 24. (15 December 2005), pp. 10695-10710.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;The TRAP/Mediator coactivator complex serves as a molecular bridge between gene-specific activators and RNA polymerase II. TRAP220/Med1 is a key component of TRAP/Mediator that targets the complex to nuclear hormone receptors and other types of activators. We show here that human TRAP220/Med1 is a specific substrate for extracellular signal-regulated kinase (ERK) of the mitogen-activated protein kinase (MAPK) family. We demonstrate that ERK phosphorylates TRAP220/Med1 in vivo at two specific sites: threonine 1032 and threonine 1457. Importantly, we found that ERK phosphorylation significantly increases the stability and half-life of TRAP220/Med1 in vivo and correlates with increased thyroid hormone receptor-dependent transcription. Furthermore, ERK phosphorylates TRAP220/Med1 in a cell cycle-dependent manner, resulting in peak levels of expression during the G2/M phase of the cell cycle. ERK phosphorylation of ectopic TRAP220/Med1 also triggered shuttling into the nucleolus, thus suggesting that ERK may regulate TRAP220/Med1 subnuclear localization. Finally, we observed that ERK phosphorylation of TRAP220/Med1 stimulates its intrinsic transcriptional coactivation activity. We propose that ERK-mediated phosphorylation is a regulatory mechanism that controls TRAP220/Med1 expression levels and modulates its functional activity.</description>
    <dc:title>Activation of TRAP/Mediator Subunit TRAP220/Med1 Is Regulated by Mitogen-Activated Protein Kinase-Dependent Phosphorylation</dc:title>

    <dc:creator>Pradeep Pandey</dc:creator>
    <dc:creator>TS Udayakumar</dc:creator>
    <dc:creator>Xinjie Lin</dc:creator>
    <dc:creator>Dipali Sharma</dc:creator>
    <dc:creator>Paul Shapiro</dc:creator>
    <dc:creator>Joseph Fondell</dc:creator>
    <dc:identifier>doi:10.1128/MCB.25.24.10695</dc:identifier>
    <dc:source>Mol. Cell. Biol., Vol. 25, No. 24. (15 December 2005), pp. 10695-10710.</dc:source>
    <dc:date>2006-05-18T22:15:32-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Mol. Cell. Biol.</prism:publicationName>
    <prism:volume>25</prism:volume>
    <prism:number>24</prism:number>
    <prism:startingPage>10695</prism:startingPage>
    <prism:endingPage>10710</prism:endingPage>
    <prism:category>mediator</prism:category>
    <prism:category>pair</prism:category>
    <prism:category>tfbs</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/643644">
    <title>Quantitative evaluation of protein-DNA interactions using an optimized knowledge-based potential.</title>
    <link>http://www.citeulike.org/user/oannes/article/643644</link>
    <description>&lt;i&gt;Nucleic Acids Res, Vol. 33, No. 2. (2005), pp. 546-558.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Computational evaluation of protein-DNA interaction is important for the identification of DNA-binding sites and genome annotation. It could validate the predicted binding motifs by sequence-based approaches through the calculation of the binding affinity between a protein and DNA. Such an evaluation should take into account structural information to deal with the complicated effects from DNA structural deformation, distance-dependent multi-body interactions and solvation contributions. In this paper, we present a knowledge-based potential built on interactions between protein residues and DNA tri-nucleotides. The potential, which explicitly considers the distance-dependent two-body, three-body and four-body interactions between protein residues and DNA nucleotides, has been optimized in terms of a Z-score. We have applied this knowledge-based potential to evaluate the binding affinities of zinc-finger protein-DNA complexes. The predicted binding affinities are in good agreement with the experimental data (with a correlation coefficient of 0.950). On a larger test set containing 48 protein-DNA complexes with known experimental binding free energies, our potential has achieved a high correlation coefficient of 0.800, when compared with the experimental data. We have also used this potential to identify binding motifs in DNA sequences of transcription factors (TF). The TFs in 79.4% of the known TF-DNA complexes have accurately found their native binding sequences from a large pool of DNA sequences. When tested in a genome-scale search for TF-binding motifs of the cyclic AMP regulatory protein (CRP) of Escherichia coli, this potential ranks all known binding motifs of CRP in the top 15% of all candidate sequences.</description>
    <dc:title>Quantitative evaluation of protein-DNA interactions using an optimized knowledge-based potential.</dc:title>

    <dc:creator>Z Liu</dc:creator>
    <dc:creator>F Mao</dc:creator>
    <dc:creator>JT Guo</dc:creator>
    <dc:creator>B Yan</dc:creator>
    <dc:creator>P Wang</dc:creator>
    <dc:creator>Y Qu</dc:creator>
    <dc:creator>Y Xu</dc:creator>
    <dc:identifier>doi:10.1093/nar/gki204</dc:identifier>
    <dc:source>Nucleic Acids Res, Vol. 33, No. 2. (2005), pp. 546-558.</dc:source>
    <dc:date>2006-05-18T04:57:23-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Nucleic Acids Res</prism:publicationName>
    <prism:issn>1362-4962</prism:issn>
    <prism:volume>33</prism:volume>
    <prism:number>2</prism:number>
    <prism:startingPage>546</prism:startingPage>
    <prism:endingPage>558</prism:endingPage>
    <prism:category>structure</prism:category>
    <prism:category>tfbs</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/600396">
    <title>Modeling gene expression control using Omes Law</title>
    <link>http://www.citeulike.org/user/oannes/article/600396</link>
    <description>&lt;i&gt;Mol Syst Biol, Vol. 2, No. 1. (11 April 2006), pp. msb4100055-E1-msb4100055-E3.&lt;/i&gt;</description>
    <dc:title>Modeling gene expression control using Omes Law</dc:title>

    <dc:creator>Harmen Bussemaker</dc:creator>
    <dc:identifier>doi:10.1038/msb4100055</dc:identifier>
    <dc:source>Mol Syst Biol, Vol. 2, No. 1. (11 April 2006), pp. msb4100055-E1-msb4100055-E3.</dc:source>
    <dc:date>2006-04-25T15:45:52-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Mol Syst Biol</prism:publicationName>
    <prism:volume>2</prism:volume>
    <prism:number>1</prism:number>
    <prism:startingPage>msb4100055-E1</prism:startingPage>
    <prism:endingPage>msb4100055-E3</prism:endingPage>
    <prism:category>pair</prism:category>
    <prism:category>tfbs</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/345227">
    <title>Local Regulatory Variation in Saccharomyces cerevisiae.</title>
    <link>http://www.citeulike.org/user/oannes/article/345227</link>
    <description>&lt;i&gt;PLoS Genet, Vol. 1, No. 2. (19 August 2005)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Naturally occurring sequence variation that affects gene expression is an important source of phenotypic differences among individuals within a species. We and others have previously shown that such regulatory variation can occur both at the same locus as the gene whose expression it affects (local regulatory variation) and elsewhere in the genome at trans-acting factors. Here we present a detailed analysis of genome-wide local regulatory variation in Saccharomyces cerevisiae. We used genetic linkage analysis to show that nearly a quarter of all yeast genes contain local regulatory variation between two divergent strains. We measured allele-specific expression in a diploid hybrid of the two strains for 77 genes showing strong self-linkage and found that in 52%-78% of these genes, local regulatory variation acts directly in cis. We also experimentally confirmed one example in which local regulatory variation in the gene AMN1 acts in trans through a feedback loop. Genome-wide sequence analysis revealed that genes subject to local regulatory variation show increased polymorphism in the promoter regions, and that some but not all of this increase is due to polymorphisms in predicted transcription factor binding sites. Increased polymorphism was also found in the 3' untranslated regions of these genes. These findings point to the importance of cis-acting variation, but also suggest that there is a diverse set of mechanisms through which local variation can affect gene expression levels.</description>
    <dc:title>Local Regulatory Variation in Saccharomyces cerevisiae.</dc:title>

    <dc:creator>James Ronald</dc:creator>
    <dc:creator>Rachel B Brem</dc:creator>
    <dc:creator>Jacqueline Whittle</dc:creator>
    <dc:creator>Leonid Kruglyak</dc:creator>
    <dc:identifier>doi:10.1371/journal.pgen.0010025</dc:identifier>
    <dc:source>PLoS Genet, Vol. 1, No. 2. (19 August 2005)</dc:source>
    <dc:date>2005-10-07T21:11:53-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>PLoS Genet</prism:publicationName>
    <prism:issn>1553-7390</prism:issn>
    <prism:volume>1</prism:volume>
    <prism:number>2</prism:number>
    <prism:category>qtl</prism:category>
    <prism:category>regulomics</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/620661">
    <title>Trans-acting regulatory variation in Saccharomyces cerevisiae and the role of transcription factors</title>
    <link>http://www.citeulike.org/user/oannes/article/620661</link>
    <description>&lt;i&gt;Nat Genet, Vol. 35, No. 1. (2003), pp. 57-64.&lt;/i&gt;</description>
    <dc:title>Trans-acting regulatory variation in Saccharomyces cerevisiae and the role of transcription factors</dc:title>

    <dc:creator>Gael Yvert</dc:creator>
    <dc:creator>Rachel Brem</dc:creator>
    <dc:creator>Jacqueline Whittle</dc:creator>
    <dc:creator>Joshua Akey</dc:creator>
    <dc:creator>Eric Foss</dc:creator>
    <dc:creator>Erin Smith</dc:creator>
    <dc:creator>Rachel Mackelprang</dc:creator>
    <dc:creator>Leonid Kruglyak</dc:creator>
    <dc:identifier>doi:10.1038/ng1222</dc:identifier>
    <dc:source>Nat Genet, Vol. 35, No. 1. (2003), pp. 57-64.</dc:source>
    <dc:date>2006-05-09T19:48:36-00:00</dc:date>
    <prism:publicationYear>2003</prism:publicationYear>
    <prism:publicationName>Nat Genet</prism:publicationName>
    <prism:volume>35</prism:volume>
    <prism:number>1</prism:number>
    <prism:startingPage>57</prism:startingPage>
    <prism:endingPage>64</prism:endingPage>
    <prism:category>qtl</prism:category>
    <prism:category>regulomics</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/620656">
    <title>Genetic Dissection of Transcriptional Regulation in Budding Yeast</title>
    <link>http://www.citeulike.org/user/oannes/article/620656</link>
    <description>&lt;i&gt;Science, Vol. 296, No. 5568. (26 April 2002), pp. 752-755.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;10.1126/science.1069516</description>
    <dc:title>Genetic Dissection of Transcriptional Regulation in Budding Yeast</dc:title>

    <dc:creator>Rachel Brem</dc:creator>
    <dc:creator>Gael Yvert</dc:creator>
    <dc:creator>Rebecca Clinton</dc:creator>
    <dc:creator>Leonid Kruglyak</dc:creator>
    <dc:identifier>doi:10.1126/science.1069516</dc:identifier>
    <dc:source>Science, Vol. 296, No. 5568. (26 April 2002), pp. 752-755.</dc:source>
    <dc:date>2006-05-09T19:40:57-00:00</dc:date>
    <prism:publicationYear>2002</prism:publicationYear>
    <prism:publicationName>Science</prism:publicationName>
    <prism:volume>296</prism:volume>
    <prism:number>5568</prism:number>
    <prism:startingPage>752</prism:startingPage>
    <prism:endingPage>755</prism:endingPage>
    <prism:category>qtl</prism:category>
    <prism:category>regulomics</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/83540">
    <title>Learning the parts of objects by non-negative matrix factorization.</title>
    <link>http://www.citeulike.org/user/oannes/article/83540</link>
    <description>&lt;i&gt;Nature, Vol. 401, No. 6755. (21 October 1999), pp. 788-791.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Is perception of the whole based on perception of its parts? There is psychological and physiological evidence for parts-based representations in the brain, and certain computational theories of object recognition rely on such representations. But little is known about how brains or computers might learn the parts of objects. Here we demonstrate an algorithm for non-negative matrix factorization that is able to learn parts of faces and semantic features of text. This is in contrast to other methods, such as principal components analysis and vector quantization, that learn holistic, not parts-based, representations. Non-negative matrix factorization is distinguished from the other methods by its use of non-negativity constraints. These constraints lead to a parts-based representation because they allow only additive, not subtractive, combinations. When non-negative matrix factorization is implemented as a neural network, parts-based representations emerge by virtue of two properties: the firing rates of neurons are never negative and synaptic strengths do not change sign.</description>
    <dc:title>Learning the parts of objects by non-negative matrix factorization.</dc:title>

    <dc:creator>DD Lee</dc:creator>
    <dc:creator>HS Seung</dc:creator>
    <dc:identifier>doi:10.1038/44565</dc:identifier>
    <dc:source>Nature, Vol. 401, No. 6755. (21 October 1999), pp. 788-791.</dc:source>
    <dc:date>2005-01-25T22:33:12-00:00</dc:date>
    <prism:publicationYear>1999</prism:publicationYear>
    <prism:publicationName>Nature</prism:publicationName>
    <prism:issn>0028-0836</prism:issn>
    <prism:volume>401</prism:volume>
    <prism:number>6755</prism:number>
    <prism:startingPage>788</prism:startingPage>
    <prism:endingPage>791</prism:endingPage>
    <prism:category>feature</prism:category>
    <prism:category>nlp-reading</prism:category>
    <prism:category>semantic</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/484846">
    <title>Discovering semantic features in the literature: a foundation for building functional associations.</title>
    <link>http://www.citeulike.org/user/oannes/article/484846</link>
    <description>&lt;i&gt;BMC Bioinformatics, Vol. 7, No. 1. (26 January 2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;ABSTRACT: BACKGROUND: Experimental techniques such as DNA microarray, serial analysis of gene expression (SAGE) and mass spectrometry proteomics, among others, are generating large amounts of data related to genes and proteins at different levels. As in any other experimental approach, it is necessary to analyze these data in the context of previously known information about the biological entities under study. The literature is a particularly valuable source of information for experiment validation and interpretation. Therefore, the development of automated text mining tools to assist in such interpretation is one of the main challenges in current bioinformatics research. RESULTS: We present a method to create literature profiles for large sets of genes or proteins based on common semantic features extracted from a corpus of relevant documents. These profiles can be used to establish pair-wise similarities among genes, utilized in gene/protein classification or can be even combined with experimental measurements. Semantic features can be used by researchers to facilitate the understanding of the commonalities indicated by experimental results. Our approach is based on non-negative matrix factorization (NMF), a machine-learning algorithm for data analysis, capable of identifying local patterns that characterize a subset of the data. The literature is thus used to establish putative relationships among subsets of genes or proteins and to provide coherent justification for this clustering into subsets. We demonstrate the utility of the method by applying it to two independent and vastly different sets of genes. CONCLUSIONS: The presented method can create literature profiles from documents relevant to sets of genes. The representation of genes as additive linear combinations of semantic features allows for the exploration of functional associations as well as for clustering, suggesting a valuable methodology for the validation and interpretation of high-throughput experimental data.</description>
    <dc:title>Discovering semantic features in the literature: a foundation for building functional associations.</dc:title>

    <dc:creator>Monica Chagoyen</dc:creator>
    <dc:creator>Pedro Carmona-Saez</dc:creator>
    <dc:creator>Hagit Shatkay</dc:creator>
    <dc:creator>Jose Carazo</dc:creator>
    <dc:creator>Alberto Pascual-Montano</dc:creator>
    <dc:identifier>doi:10.1186/1471-2105-7-41</dc:identifier>
    <dc:source>BMC Bioinformatics, Vol. 7, No. 1. (26 January 2006)</dc:source>
    <dc:date>2006-01-29T14:32:39-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>BMC Bioinformatics</prism:publicationName>
    <prism:issn>1471-2105</prism:issn>
    <prism:volume>7</prism:volume>
    <prism:number>1</prism:number>
    <prism:category>feature</prism:category>
    <prism:category>nlp-reading</prism:category>
    <prism:category>semantic</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/604899">
    <title>Genome-wide computational prediction of transcriptional regulatory modules reveals new insights into human gene expression.</title>
    <link>http://www.citeulike.org/user/oannes/article/604899</link>
    <description>&lt;i&gt;Genome Res (10 April 2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;The identification of regulatory regions is one of the most important and challenging problems toward the functional annotation of the human genome. In higher eukaryotes, transcription-factor (TF) binding sites are often organized in clusters called cis-regulatory modules (CRM). While the prediction of individual TF-binding sites is a notoriously difficult problem, CRM prediction has proven to be somewhat more reliable. Starting from a set of predicted binding sites for more than 200 TF families documented in Transfac, we describe an algorithm relying on the principle that CRMs generally contain several phylogenetically conserved binding sites for a few different TFs. The method allows the prediction of more than 118,000 CRMs within the human genome. A subset of these is shown to be bound in vivo by TFs using ChIP-chip. Their analysis reveals, among other things, that CRM density varies widely across the genome, with CRM-rich regions often being located near genes encoding transcription factors involved in development. Predicted CRMs show a surprising enrichment near the 3' end of genes and in regions far from genes. We document the tendency for certain TFs to bind modules located in specific regions with respect to their target genes and identify TFs likely to be involved in tissue-specific regulation. The set of predicted CRMs, which is made available as a public database called PReMod (http://genomequebec.mcgill.ca/PReMod), will help analyze regulatory mechanisms in specific biological systems.</description>
    <dc:title>Genome-wide computational prediction of transcriptional regulatory modules reveals new insights into human gene expression.</dc:title>

    <dc:creator>Mathieu Blanchette</dc:creator>
    <dc:creator>Alain R Bataille</dc:creator>
    <dc:creator>Xiaoyu Chen</dc:creator>
    <dc:creator>Christian Poitras</dc:creator>
    <dc:creator>Josée Laganière</dc:creator>
    <dc:creator>Céline Lefèbvre</dc:creator>
    <dc:creator>Geneviève Deblois</dc:creator>
    <dc:creator>Vincent Giguère</dc:creator>
    <dc:creator>Vincent Ferretti</dc:creator>
    <dc:creator>Dominique Bergeron</dc:creator>
    <dc:creator>Benoit Coulombe</dc:creator>
    <dc:creator>François Robert</dc:creator>
    <dc:identifier>doi:10.1101/gr.4866006</dc:identifier>
    <dc:source>Genome Res (10 April 2006)</dc:source>
    <dc:date>2006-04-27T19:23:55-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Genome Res</prism:publicationName>
    <prism:issn>1088-9051</prism:issn>
    <prism:category>tfbs</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/604898">
    <title>Protein-DNA binding specificity predictions with structural models.</title>
    <link>http://www.citeulike.org/user/oannes/article/604898</link>
    <description>&lt;i&gt;Nucleic Acids Res, Vol. 33, No. 18. (2005), pp. 5781-5798.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Protein-DNA interactions play a central role in transcriptional regulation and other biological processes. Investigating the mechanism of binding affinity and specificity in protein-DNA complexes is thus an important goal. Here we develop a simple physical energy function, which uses electrostatics, solvation, hydrogen bonds and atom-packing terms to model direct readout and sequence-specific DNA conformational energy to model indirect readout of DNA sequence by the bound protein. The predictive capability of the model is tested against another model based only on the knowledge of the consensus sequence and the number of contacts between amino acids and DNA bases. Both models are used to carry out predictions of protein-DNA binding affinities which are then compared with experimental measurements. The nearly additive nature of protein-DNA interaction energies in our model allows us to construct position-specific weight matrices by computing base pair probabilities independently for each position in the binding site. Our approach is less data intensive than knowledge-based models of protein-DNA interactions, and is not limited to any specific family of transcription factors. However, native structures of protein-DNA complexes or their close homologs are required as input to the model. Use of homology modeling can significantly increase the extent of our approach, making it a useful tool for studying regulatory pathways in many organisms and cell types.</description>
    <dc:title>Protein-DNA binding specificity predictions with structural models.</dc:title>

    <dc:creator>AV Morozov</dc:creator>
    <dc:creator>JJ Havranek</dc:creator>
    <dc:creator>D Baker</dc:creator>
    <dc:creator>ED Siggia</dc:creator>
    <dc:source>Nucleic Acids Res, Vol. 33, No. 18. (2005), pp. 5781-5798.</dc:source>
    <dc:date>2006-04-27T19:19:28-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Nucleic Acids Res</prism:publicationName>
    <prism:issn>1362-4962</prism:issn>
    <prism:volume>33</prism:volume>
    <prism:number>18</prism:number>
    <prism:startingPage>5781</prism:startingPage>
    <prism:endingPage>5798</prism:endingPage>
    <prism:category>tfbs</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/604897">
    <title>Annotating significant pairs of transcription factor binding sites in regulatory DNA.</title>
    <link>http://www.citeulike.org/user/oannes/article/604897</link>
    <description>&lt;i&gt;In Silico Biol, Vol. 4, No. 4. (2004), pp. 479-487.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;In the presented work we search for transcription factor binding sites (BS) by including additional information about typical BS patterns. The new proposed score combines the ordinary profile score based on TRANSFAC-matrices together with a score based on pairs of BS. The latter score positively weights pairs of BS that tend to occur together in many regulatory DNA-sequences, in contrast to a random background model. The empirical BS pair frequencies result from our evaluation of a large dataset of orthologous genes.</description>
    <dc:title>Annotating significant pairs of transcription factor binding sites in regulatory DNA.</dc:title>

    <dc:creator>K Rateitschak</dc:creator>
    <dc:creator>T Müller</dc:creator>
    <dc:creator>M Vingron</dc:creator>
    <dc:source>In Silico Biol, Vol. 4, No. 4. (2004), pp. 479-487.</dc:source>
    <dc:date>2006-04-27T19:17:17-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:publicationName>In Silico Biol</prism:publicationName>
    <prism:issn>1386-6338</prism:issn>
    <prism:volume>4</prism:volume>
    <prism:number>4</prism:number>
    <prism:startingPage>479</prism:startingPage>
    <prism:endingPage>487</prism:endingPage>
    <prism:category>pair</prism:category>
    <prism:category>tfbs</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/604896">
    <title>Distance preferences in the arrangement of binding motifs and hierarchical levels in organization of transcription regulatory information.</title>
    <link>http://www.citeulike.org/user/oannes/article/604896</link>
    <description>&lt;i&gt;Nucleic Acids Res, Vol. 31, No. 20. (15 October 2003), pp. 6016-6026.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We explored distance preferences in the arrangement of binding motifs for five transcription factors (Bicoid, Krüppel, Hunchback, Knirps and Caudal) in a large set of Drosophila cis-regulatory modules (CRMs). Analysis of non-overlapping binding motifs revealed the presence of periodic signals specific to particular combinations of binding motifs. The most striking periodic signals (10 bp for Bicoid and 11 bp for Hunchback) suggest preferential positioning of some binding site combinations on the same side of the DNA helix. We also analyzed distance preferences in arrangements of highly correlated overlapping binding motifs, such as Bicoid and Krüppel. Based on the distance analysis, we extracted preferential binding site arrangements and proposed models for potential composite elements (CEs) and antagonistic motif pairs involved in the function of developmental CRMs. Our results suggest that there are distinct hierarchical levels in the organization of transcription regulatory information. We discuss the role of the hierarchy in understanding transcriptional regulation and in detection of transcription regulatory regions in genomes.</description>
    <dc:title>Distance preferences in the arrangement of binding motifs and hierarchical levels in organization of transcription regulatory information.</dc:title>

    <dc:creator>VJ Makeev</dc:creator>
    <dc:creator>AP Lifanov</dc:creator>
    <dc:creator>AG Nazina</dc:creator>
    <dc:creator>DA Papatsenko</dc:creator>
    <dc:source>Nucleic Acids Res, Vol. 31, No. 20. (15 October 2003), pp. 6016-6026.</dc:source>
    <dc:date>2006-04-27T19:16:12-00:00</dc:date>
    <prism:publicationYear>2003</prism:publicationYear>
    <prism:publicationName>Nucleic Acids Res</prism:publicationName>
    <prism:issn>1362-4962</prism:issn>
    <prism:volume>31</prism:volume>
    <prism:number>20</prism:number>
    <prism:startingPage>6016</prism:startingPage>
    <prism:endingPage>6026</prism:endingPage>
    <prism:category>distance</prism:category>
    <prism:category>pair</prism:category>
    <prism:category>tfbs</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/604894">
    <title>Predicting transcription factor synergism.</title>
    <link>http://www.citeulike.org/user/oannes/article/604894</link>
    <description>&lt;i&gt;Nucleic Acids Res, Vol. 30, No. 19. (1 October 2002), pp. 4278-4284.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Transcriptional regulation is mediated by a battery of transcription factor (TF) proteins, that form complexes involving protein-protein and protein-DNA interactions. Individual TFs bind to their cognate cis-elements or transcription factor-binding sites (TFBS). TFBS are organized on the DNA proximal to the gene in groups confined to a few hundred base pair regions. These groups are referred to as modules. Various modules work together to provide the combinatorial regulation of gene transcription in response to various developmental and environmental conditions. The sets of modules constitute a promoter model. Determining the TFs that preferentially work in concert as part of a module is an essential component of understanding transcriptional regulation. The TFs that act synergistically in such a fashion are likely to have their cis-elements co-localized on the genome at specific distances apart. We exploit this notion to predict TF pairs that are likely to be part of a transcriptional module on the human genome sequence. The computational method is validated statistically, using known interacting pairs extracted from the literature. There are 251 TFBS pairs up to 50 bp apart and 70 TFBS pairs up to 200 bp apart that score higher than any of the known synergistic pairs. Further investigation of 50 pairs randomly selected from each of these two sets using PubMed queries provided additional supporting evidence from the existing biological literature suggesting TF synergism for these novel pairs.</description>
    <dc:title>Predicting transcription factor synergism.</dc:title>

    <dc:creator>S Hannenhalli</dc:creator>
    <dc:creator>S Levy</dc:creator>
    <dc:source>Nucleic Acids Res, Vol. 30, No. 19. (1 October 2002), pp. 4278-4284.</dc:source>
    <dc:date>2006-04-27T19:13:09-00:00</dc:date>
    <prism:publicationYear>2002</prism:publicationYear>
    <prism:publicationName>Nucleic Acids Res</prism:publicationName>
    <prism:issn>1362-4962</prism:issn>
    <prism:volume>30</prism:volume>
    <prism:number>19</prism:number>
    <prism:startingPage>4278</prism:startingPage>
    <prism:endingPage>4284</prism:endingPage>
    <prism:category>pair</prism:category>
    <prism:category>tfbs</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/604893">
    <title>Annotating significant pairs of transcription factor binding sites in regulatory DNA</title>
    <link>http://www.citeulike.org/user/oannes/article/604893</link>
    <description>&lt;i&gt;&lt;/i&gt;</description>
    <dc:title>Annotating significant pairs of transcription factor binding sites in regulatory DNA</dc:title>

    <dc:date>2006-04-27T19:10:02-00:00</dc:date>
    <prism:category>pair</prism:category>
    <prism:category>tfbs</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/604892">
    <title>Genome-wide prediction and analysis of function-specific transcription factor binding sites</title>
    <link>http://www.citeulike.org/user/oannes/article/604892</link>
    <description>&lt;i&gt;&lt;/i&gt;</description>
    <dc:title>Genome-wide prediction and analysis of function-specific transcription factor binding sites</dc:title>

    <dc:date>2006-04-27T19:08:12-00:00</dc:date>
    <prism:category>pair</prism:category>
    <prism:category>tfbs</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/604258">
    <title>STEM: Short Time-series Expression Miner</title>
    <link>http://www.citeulike.org/user/oannes/article/604258</link>
    <description>&lt;i&gt;&lt;/i&gt;</description>
    <dc:title>STEM: Short Time-series Expression Miner</dc:title>

    <dc:date>2006-04-27T08:04:09-00:00</dc:date>
    <prism:category>series</prism:category>
    <prism:category>time</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/604257">
    <title>Statistic of Financial Markets</title>
    <link>http://www.citeulike.org/user/oannes/article/604257</link>
    <description>&lt;i&gt;&lt;/i&gt;</description>
    <dc:title>Statistic of Financial Markets</dc:title>

    <dc:date>2006-04-27T08:00:15-00:00</dc:date>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/604248">
    <title>Novel technique for preprocessing high dimensional time-course data from DNA microarray: mathematical model-based clustering.</title>
    <link>http://www.citeulike.org/user/oannes/article/604248</link>
    <description>&lt;i&gt;Bioinformatics, Vol. 22, No. 7. (1 April 2006), pp. 843-848.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;MOTIVATION: Classifying genes into clusters depending on their expression profiles is one of the most important analysis techniques for microarray data. Because temporal gene expression profiles are indicative of the dynamic functional properties of genes, the application of clustering analysis to time-course data allows the more precise division of genes into functional classes. Conventional clustering methods treat the sampling data at each time point as data obtained under different experimental conditions without considering the continuity of time-course data between time periods t and t+1. Here, we propose a method designated mathematical model-based clustering (MMBC). RESULTS: The proposed method, designated MMBC, was applied to artificial data and time-course data obtained using Saccharomyces cerevisiae. Our method is able to divide data into clusters more accurately and coherently than conventional clustering methods. Furthermore, MMBC is more tolerant to noise than conventional clustering methods. AVAILABILITY: Software is available upon request. CONTACT: taizo@brs.kyushu-u.ac.jp.</description>
    <dc:title>Novel technique for preprocessing high dimensional time-course data from DNA microarray: mathematical model-based clustering.</dc:title>

    <dc:creator>K Hakamada</dc:creator>
    <dc:creator>M Okamoto</dc:creator>
    <dc:creator>T Hanai</dc:creator>
    <dc:source>Bioinformatics, Vol. 22, No. 7. (1 April 2006), pp. 843-848.</dc:source>
    <dc:date>2006-04-27T07:11:34-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Bioinformatics</prism:publicationName>
    <prism:issn>1367-4803</prism:issn>
    <prism:volume>22</prism:volume>
    <prism:number>7</prism:number>
    <prism:startingPage>843</prism:startingPage>
    <prism:endingPage>848</prism:endingPage>
    <prism:category>clustering</prism:category>
    <prism:category>course</prism:category>
    <prism:category>microarray</prism:category>
    <prism:category>time</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/604247">
    <title>R: Analysis of Multiple Time Course Data</title>
    <link>http://www.citeulike.org/user/oannes/article/604247</link>
    <description>&lt;i&gt;&lt;/i&gt;</description>
    <dc:title>R: Analysis of Multiple Time Course Data</dc:title>

    <dc:date>2006-04-27T06:58:47-00:00</dc:date>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/233328">
    <title>Differential and trajectory methods for time course gene expression data</title>
    <link>http://www.citeulike.org/user/oannes/article/233328</link>
    <description>&lt;i&gt;Bioinformatics, Vol. 21, No. 13. (1 July 2005), pp. 3009-3016.&lt;/i&gt;</description>
    <dc:title>Differential and trajectory methods for time course gene expression data</dc:title>

    <dc:creator>Yulan Liang</dc:creator>
    <dc:creator>Bamidele Tayo</dc:creator>
    <dc:creator>Xueya Cai</dc:creator>
    <dc:creator>Arpad Kelemen</dc:creator>
    <dc:identifier>doi:10.1093/bioinformatics/bti465</dc:identifier>
    <dc:source>Bioinformatics, Vol. 21, No. 13. (1 July 2005), pp. 3009-3016.</dc:source>
    <dc:date>2005-06-21T10:29:26-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Bioinformatics</prism:publicationName>
    <prism:issn>1367-4803</prism:issn>
    <prism:volume>21</prism:volume>
    <prism:number>13</prism:number>
    <prism:startingPage>3009</prism:startingPage>
    <prism:endingPage>3016</prism:endingPage>
    <prism:publisher>Oxford University Press</prism:publisher>
    <prism:category>clustering</prism:category>
    <prism:category>course</prism:category>
    <prism:category>microarray</prism:category>
    <prism:category>time</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/604164">
    <title>Integrated analysis of gene expression by Association Rules Discovery.</title>
    <link>http://www.citeulike.org/user/oannes/article/604164</link>
    <description>&lt;i&gt;BMC Bioinformatics, Vol. 7 (2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND: Microarray technology is generating huge amounts of data about the expression level of thousands of genes, or even whole genomes, across different experimental conditions. To extract biological knowledge, and to fully understand such datasets, it is essential to include external biological information about genes and gene products to the analysis of expression data. However, most of the current approaches to analyze microarray datasets are mainly focused on the analysis of experimental data, and external biological information is incorporated as a posterior process. RESULTS: In this study we present a method for the integrative analysis of microarray data based on the Association Rules Discovery data mining technique. The approach integrates gene annotations and expression data to discover intrinsic associations among both data sources based on co-occurrence patterns. We applied the proposed methodology to the analysis of gene expression datasets in which genes were annotated with metabolic pathways, transcriptional regulators and Gene Ontology categories. Automatically extracted associations revealed significant relationships among these gene attributes and expression patterns, where many of them are clearly supported by recently reported work. CONCLUSION: The integration of external biological information and gene expression data can provide insights about the biological processes associated to gene expression programs. In this paper we show that the proposed methodology is able to integrate multiple gene annotations and expression data in the same analytic framework and extract meaningful associations among heterogeneous sources of data. An implementation of the method is included in the Engene software package.</description>
    <dc:title>Integrated analysis of gene expression by Association Rules Discovery.</dc:title>

    <dc:creator>P Carmona-Saez</dc:creator>
    <dc:creator>M Chagoyen</dc:creator>
    <dc:creator>A Rodriguez</dc:creator>
    <dc:creator>O Trelles</dc:creator>
    <dc:creator>JM Carazo</dc:creator>
    <dc:creator>A Pascual-Montano</dc:creator>
    <dc:identifier>doi:10.1186/1471-2105-7-54</dc:identifier>
    <dc:source>BMC Bioinformatics, Vol. 7 (2006)</dc:source>
    <dc:date>2006-04-27T04:35:51-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>BMC Bioinformatics</prism:publicationName>
    <prism:issn>1471-2105</prism:issn>
    <prism:volume>7</prism:volume>
    <prism:category>arm</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/604163">
    <title>A multi-step approach to time series analysis and gene expression clustering.</title>
    <link>http://www.citeulike.org/user/oannes/article/604163</link>
    <description>&lt;i&gt;Bioinformatics, Vol. 22, No. 5. (1 March 2006), pp. 589-596.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;MOTIVATION: The huge growth in gene expression data calls for the implementation of automatic tools for data processing and interpretation. RESULTS: We present a new and comprehensive machine learning data mining framework consisting in a non-linear PCA neural network for feature extraction, and probabilistic principal surfaces combined with an agglomerative approach based on Negentropy aimed at clustering gene microarray data. The method, which provides a user-friendly visualization interface, can work on noisy data with missing points and represents an automatic procedure to get, with no a priori assumptions, the number of clusters present in the data. Cell-cycle dataset and a detailed analysis confirm the biological nature of the most significant clusters. AVAILABILITY: The software described here is a subpackage part of the ASTRONEURAL package and is available upon request from the corresponding author. SUPPLEMENTARY INFORMATION: Supplementary data are available at Bioinformatics online.</description>
    <dc:title>A multi-step approach to time series analysis and gene expression clustering.</dc:title>

    <dc:creator>R Amato</dc:creator>
    <dc:creator>A Ciaramella</dc:creator>
    <dc:creator>N Deniskina</dc:creator>
    <dc:creator>C Del Mondo</dc:creator>
    <dc:creator>D di Bernardo</dc:creator>
    <dc:creator>C Donalek</dc:creator>
    <dc:creator>G Longo</dc:creator>
    <dc:creator>G Mangano</dc:creator>
    <dc:creator>G Miele</dc:creator>
    <dc:creator>G Raiconi</dc:creator>
    <dc:creator>A Staiano</dc:creator>
    <dc:creator>R Tagliaferri</dc:creator>
    <dc:source>Bioinformatics, Vol. 22, No. 5. (1 March 2006), pp. 589-596.</dc:source>
    <dc:date>2006-04-27T04:18:18-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Bioinformatics</prism:publicationName>
    <prism:issn>1367-4803</prism:issn>
    <prism:volume>22</prism:volume>
    <prism:number>5</prism:number>
    <prism:startingPage>589</prism:startingPage>
    <prism:endingPage>596</prism:endingPage>
    <prism:category>clustering</prism:category>
    <prism:category>microarray</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/598491">
    <title>Schema for TFBS Conserved - HMR Conserved Transcription Factor Binding Sites</title>
    <link>http://www.citeulike.org/user/oannes/article/598491</link>
    <description>&lt;i&gt;&lt;/i&gt;</description>
    <dc:title>Schema for TFBS Conserved - HMR Conserved Transcription Factor Binding Sites</dc:title>

    <dc:date>2006-04-24T17:43:45-00:00</dc:date>
    <prism:category>tfbs</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/oannes/article/519835">
    <title>Genome-wide prediction and characterization of interactions between transcription factors in Saccharomyces cerevisiae.</title>
    <link>http://www.citeulike.org/user/oannes/article/519835</link>
    <description>&lt;i&gt;Nucleic Acids Res, Vol. 34, No. 3. (2006), pp. 917-927.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Combinatorial regulation by transcription factor complexes is an important feature of eukaryotic gene regulation. Here, we propose a new method for identification of interactions between transcription factors (TFs) that relies on the relationship of their binding sites, and we test it using Saccharomyces cerevisiae as a model system. The algorithm predicts interacting TF pairs based on the co-occurrence of their binding motifs and the distance between the motifs in promoter sequences. This allows investigation of interactions between TFs without known binding motifs or expression data. With this approach, 300 significant interactions involving 77 TFs were identified. These included more than 70% of the known protein-protein interactions. Approximately half of the detected interacting motif pairs showed strong preferences for particular distances and orientations in the promoter sequences. These one dimensional features may reflect constraints on allowable spatial arrangements for protein-protein interactions. Evidence for biological relevance of the observed characteristic distances is provided by the finding that target genes with the same characteristic distances show significantly higher co-expression than those without preferred distances. Furthermore, the observed interactions were dynamic: most of the TF pairs were not constitutively active, but rather showed variable activity depending on the physiological condition of the cells. Interestingly, some TF pairs active in multiple conditions showed preferences for different distances and orientations depending on the condition. Our prediction and characterization of TF interactions may help to understand the transcriptional regulatory networks in eukaryotic systems.</description>
    <dc:title>Genome-wide prediction and characterization of interactions between transcription factors in Saccharomyces cerevisiae.</dc:title>

    <dc:creator>X Yu</dc:creator>
    <dc:creator>J Lin</dc:creator>
    <dc:creator>T Masuda</dc:creator>
    <dc:creator>N Esumi</dc:creator>
    <dc:creator>DJ Zack</dc:creator>
    <dc:creator>J Qian</dc:creator>
    <dc:source>Nucleic Acids Res, Vol. 34, No. 3. (2006), pp. 917-927.</dc:source>
    <dc:date>2006-02-24T15:58:20-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Nucleic Acids Res</prism:publicationName>
    <prism:issn>1362-4962</prism:issn>
    <prism:volume>34</prism:volume>
    <prism:number>3</prism:number>
    <prism:startingPage>917</prism:startingPage>
    <prism:endingPage>927</prism:endingPage>
    <prism:category>distance</prism:category>
    <prism:category>pair</prism:category>
    <prism:category>tfbs</prism:category>
</item>



</rdf:RDF>

