<?xml version="1.0" encoding="UTF-8"?>

<rdf:RDF
   xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
   xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#"
   xmlns="http://purl.org/rss/1.0/"
   xmlns:dc="http://purl.org/dc/elements/1.1/"
   xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/"
   xmlns:dcterms="http://purl.org/dc/terms/"

>
<channel rdf:about="http://www.citeulike.org/about">
<pubDate>Sat, 05 Jul 2008 23:14:24 BST</pubDate>


	<title>CiteULike: mariakmejia's library [54 articles]</title>
	<description>CiteULike: mariakmejia's library [54 articles]</description>


	<link>http://www.citeulike.org/user/mariakmejia</link>
	<dc:publisher>CiteULike.org</dc:publisher>
	<dc:language>en-gb</dc:language>
	<dc:rights>Copyright &#169; 2004-2008 citeulike.org</dc:rights>
	<items>
    <rdf:Seq>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2811217"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2811212"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2802903"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2804733"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2800782"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2805447"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2800447"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2800446"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2800442"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2798076"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2800428"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2800212"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2800422"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2800420"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2800418"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2800415"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2784636"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2784635"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2784634"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2784632"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2784631"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2784627"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2782164"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2784625"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2784624"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2738967"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2784622"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2784619"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2062092"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/466068"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/456205"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/106364"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/711440"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/483014"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/717214"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/715688"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/698675"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/771643"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/166875"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/684573"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/700992"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/915261"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/1285080"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/1116998"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/437270"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/238188"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2369506"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2629481"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/1145123"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/mariakmejia/article/2311222"/>

	</rdf:Seq>
	</items>
	</channel>


<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2811217">
    <title>GeneCAT--novel webtools that combine BLAST and co-expression analyses.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2811217</link>
    <description>&lt;i&gt;Nucleic acids research (14 May 2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;The gene co-expression analysis toolbox (GeneCAT) introduces several novel microarray data analyzing tools. First, the multigene co-expression analysis, combined with co-expressed gene networks, provides a more powerful data mining technique than standard, single-gene co-expression analysis. Second, the high-throughput Map-O-Matic tool matches co-expression pattern of multiple query genes to genes present in user-defined subdatabases, and can therefore be used for gene mapping in forward genetic screens. Third, Rosetta combines co-expression analysis with BLAST and can be used to find 'true' gene orthologs in the plant model organisms Arabidopsis thaliana and Hordeum vulgare (Barley). GeneCAT is equipped with expression data for the model plant A. thaliana, and first to introduce co-expression mining tools for the monocot Barley. GeneCAT is available at http://genecat.mpg.de.</description>
    <dc:title>GeneCAT--novel webtools that combine BLAST and co-expression analyses.</dc:title>

    <dc:creator>Marek Mutwil</dc:creator>
    <dc:creator>Jens Obro</dc:creator>
    <dc:creator>William G T Willats</dc:creator>
    <dc:creator>Staffan Persson</dc:creator>
    <dc:source>Nucleic acids research (14 May 2008)</dc:source>
    <dc:date>2008-05-18T21:56:00-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Nucleic acids research</prism:publicationName>
    <prism:issn>1362-4962</prism:issn>
    <prism:category>blast</prism:category>
    <prism:category>microarrays</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2811212">
    <title>SerbGO: searching for the best GO tool.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2811212</link>
    <description>&lt;i&gt;Nucleic acids research (14 May 2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;In recent years, the scientific community has provided many tools to assist with pathway analysis. Some of these programs can be used to manage functional annotation of gene products, others are oriented to exploring and analyzing data sets and many allow both possibilities. Potential users of these tools are faced with the necessity to decide which of the existing programs are the most appropriate for their needs. SerbGO is a user-friendly web tool created to facilitate this task. It can be used (i) to search for specific functionalities and determine which applications provide them and (ii) to compare several applications on the basis of different types of functionalities. Iterating and combining both functionalities can easily lead to selecting an appropriate tool. Data required by SerbGO is either the desired capabilities within a defined Standard Functionalities Set or the list of the tools to be compared. The analysis performed carries out a cross-classification that produces an easily readable output with the list of tools that implement the capabilities demanded or a table with the categorization of the GO tools that one wishes to compare. SerbGO is freely available and does not require a login. It can be accessed either directly at our server (http://estbioinfo.stat.ub.es/apli/serbgo) or at the GO Consortium website (http://www.geneontology.org/GO.tools.microarray.shtml#serbgo).</description>
    <dc:title>SerbGO: searching for the best GO tool.</dc:title>

    <dc:creator>J L Mosquera</dc:creator>
    <dc:creator>A Sánchez-Pla</dc:creator>
    <dc:source>Nucleic acids research (14 May 2008)</dc:source>
    <dc:date>2008-05-18T21:47:51-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Nucleic acids research</prism:publicationName>
    <prism:issn>1362-4962</prism:issn>
    <prism:category>semantic_web</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2802903">
    <title>Plant biology: In their neighbour's shadow</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2802903</link>
    <description>&lt;i&gt;Nature, Vol. 453, No. 7193. (14 May 2008), pp. 298-299.&lt;/i&gt;</description>
    <dc:title>Plant biology: In their neighbour's shadow</dc:title>

    <dc:creator>Ji[rbreve]í Friml</dc:creator>
    <dc:creator>Michael Sauer</dc:creator>
    <dc:identifier>doi:10.1038/453298a</dc:identifier>
    <dc:source>Nature, Vol. 453, No. 7193. (14 May 2008), pp. 298-299.</dc:source>
    <dc:date>2008-05-15T23:29:38-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Nature</prism:publicationName>
    <prism:issn>0028-0836</prism:issn>
    <prism:volume>453</prism:volume>
    <prism:number>7193</prism:number>
    <prism:startingPage>298</prism:startingPage>
    <prism:endingPage>299</prism:endingPage>
    <prism:publisher>Nature Publishing Group</prism:publisher>
    <prism:category>plants</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2804733">
    <title>Widespread Translational Inhibition by Plant miRNAs and siRNAs</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2804733</link>
    <description>&lt;i&gt;Science (15 May 2008), 1159151.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;High complementarity between plant miRNAs and their mRNA targets is thought to cause silencing prevalently by endonucleolytic cleavage. We have isolated Arabidopsis mutants defective in miRNA action. Their analysis provides evidence that plant miRNA-guided silencing has a widespread translational inhibitory component that is genetically separable from endonucleolytic cleavage. We further show that the same is true of silencing mediated by short interfering (si)RNA populations. Translational repression is effected in part by the ARGONAUTE proteins AGO1 and AGO10. It also requires the activity of the microtubule-severing enzyme katanin, implicating cytoskeleton dynamics in miRNA action as recently suggested from animal studies. Also as in animals, the decapping component VCS/Ge-1 is required for translational repression by miRNAs, suggesting that the underlying mechanisms in the two kingdoms are related. 10.1126/science.1159151</description>
    <dc:title>Widespread Translational Inhibition by Plant miRNAs and siRNAs</dc:title>

    <dc:creator>Peter Brodersen</dc:creator>
    <dc:creator>Lali Sakvarelidze-Achard</dc:creator>
    <dc:creator>Marianne Bruun-Rasmussen</dc:creator>
    <dc:creator>Patrice Dunoyer</dc:creator>
    <dc:creator>Yoshiharu Yamamoto</dc:creator>
    <dc:creator>Leslie Sieburth</dc:creator>
    <dc:creator>Olivier Voinnet</dc:creator>
    <dc:identifier>doi:10.1126/science.1159151</dc:identifier>
    <dc:source>Science (15 May 2008), 1159151.</dc:source>
    <dc:date>2008-05-16T09:08:52-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Science</prism:publicationName>
    <prism:startingPage>1159151</prism:startingPage>
    <prism:category>transcription</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2800782">
    <title>Use and misuse of the gene ontology annotations.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2800782</link>
    <description>&lt;i&gt;Nature reviews. Genetics (13 May 2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;The Gene Ontology (GO) project is a collaboration among model organism databases to describe gene products from all organisms using a consistent and computable language. GO produces sets of explicitly defined, structured vocabularies that describe biological processes, molecular functions and cellular components of gene products in both a computer- and human-readable manner. Here we describe key aspects of GO, which, when overlooked, can cause erroneous results, and address how these pitfalls can be avoided.</description>
    <dc:title>Use and misuse of the gene ontology annotations.</dc:title>

    <dc:creator>Seung Yon Rhee</dc:creator>
    <dc:creator>Valerie Wood</dc:creator>
    <dc:creator>Kara Dolinski</dc:creator>
    <dc:creator>Sorin Draghici</dc:creator>
    <dc:identifier>doi:10.1038/nrg2363</dc:identifier>
    <dc:source>Nature reviews. Genetics (13 May 2008)</dc:source>
    <dc:date>2008-05-15T05:58:28-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Nature reviews. Genetics</prism:publicationName>
    <prism:issn>1471-0064</prism:issn>
    <prism:category>semantic_web</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2805447">
    <title>Genetic approaches to crop improvement: responding to environmental and population changes.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2805447</link>
    <description>&lt;i&gt;Nature reviews. Genetics (13 May 2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Crop production is threatened by global climate change, and recent demands for crops to produce bio-fuels have started to affect the worldwide supply of some of the most important foods. How can we support a growing human population in such circumstances? One potential solution is the improvement of crops to increase yield from both irrigated and non-irrigated lands, and to create novel varieties that are more tolerant to environmental stresses. Recent progress has been made in the isolation and functional analyses of genes controlling yield and tolerance to abiotic stresses. In addition, promising new methods are being developed for identifying additional genes and variants of interest and putting these to practical use in crop improvement.</description>
    <dc:title>Genetic approaches to crop improvement: responding to environmental and population changes.</dc:title>

    <dc:creator>Shin Takeda</dc:creator>
    <dc:creator>Makoto Matsuoka</dc:creator>
    <dc:identifier>doi:10.1038/nrg2342</dc:identifier>
    <dc:source>Nature reviews. Genetics (13 May 2008)</dc:source>
    <dc:date>2008-05-16T15:16:17-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Nature reviews. Genetics</prism:publicationName>
    <prism:issn>1471-0064</prism:issn>
    <prism:category>genetic_regulation</prism:category>
    <prism:category>plants</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2800447">
    <title>How Athila retrotransposons survive in the Arabidopsis genome</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2800447</link>
    <description>&lt;i&gt;BMC Genomics, Vol. 9, No. 1. (2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND:Transposable elements are selfish genetic sequences which only occasionally provide useful functions to their host species. In addition, models of mobile element evolution assume a second type of selfishness: elements of different familes do not cooperate, but they independently fight for their survival in the host genome.RESULTS:We show that recombination events among distantly related Athila retrotransposons have led to the generation of new Athila lineages. Their pattern of diversification suggests that Athila elements survive in Arabidopsis by a combination of selfish replication and of amplification of highly diverged copies with coding potential. Many Athila elements are non-autonomous but still conserve intact open reading frames which are under the effect of negative, purifying natural selection. CONCLUSIONS:The evolution of these mobile elements is far more complex than hitherto assumed. Strict selfish replication does not explain all the patterns observed.</description>
    <dc:title>How Athila retrotransposons survive in the Arabidopsis genome</dc:title>

    <dc:creator>Antonio Marco</dc:creator>
    <dc:creator>Ignacio Marin</dc:creator>
    <dc:identifier>doi:10.1186/1471-2164-9-219</dc:identifier>
    <dc:source>BMC Genomics, Vol. 9, No. 1. (2008)</dc:source>
    <dc:date>2008-05-15T01:18:55-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>BMC Genomics</prism:publicationName>
    <prism:volume>9</prism:volume>
    <prism:number>1</prism:number>
    <prism:category>arabidopsis</prism:category>
    <prism:category>genomics_analysis</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2800446">
    <title>Arabidopsis mRNA polyadenylation machinery: comprehensive analysis of protein-protein interactions and gene expression profiling</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2800446</link>
    <description>&lt;i&gt;BMC Genomics, Vol. 9, No. 1. (2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND:The polyadenylation of mRNA is one of the critical processing steps during expression of almost all eukaryotic genes. It is tightly integrated with transcription, particularly its termination, as well as other RNA processing events, i.e. capping and splicing. The poly(A) tail protects the mRNA from unregulated degradation, and it is required for nuclear export and translation initiation. In recent years, it has been demonstrated that the polyadenylation process is also involved in the regulation of gene expression. The polyadenylation process requires two components, the cis-elements on the mRNA and a group of protein factors that recognize the cis-elements and produce the poly(A) tail. Here we report a comprehensive pairwise protein-protein interaction mapping and gene expression profiling of the mRNA polyadenylation protein machinery in Arabidopsis. RESULTS:By protein sequence homology search using human and yeast polyadenylation factors, we identified 28 proteins that may be components of Arabidopsis polyadenylation machinery. To elucidate the protein network and their functions, we first tested their protein-protein interaction profiles. Out of 320 pair-wise protein-protein interaction assays done using the yeast two-hybrid system, 56 (~17%) showed positive interactions. 15 of these interactions were further tested, and all were confirmed by co-immunoprecipitation and/or in vitro co-purification. These interactions organize into three distinct hubs involving the Arabidopsis polyadenylation factors. These hubs are centered around AtCPSF100, AtCLPS, and AtFIPS. The first two are similar to complexes seen in mammals, while the third one stands out as unique to plants. When comparing the gene expression profiles extracted from publicly available microarray datasets, some of the polyadenylation related genes showed tissue-specific expression, suggestive of potential different polyadenylation complex configurations. CONCLUSIONS:An extensive protein network was revealed for plant polyadenylation machinery, in which all predicted proteins were found to be connecting to the complex. The gene expression profiles are indicative that specialized sub-complexes may be formed to carry out targeted processing of mRNA in different developmental stages and tissue types. These results offer a roadmap for further functional characterizations of the protein factors, and for building models when testing the genetic contributions of these genes in plant growth and development.</description>
    <dc:title>Arabidopsis mRNA polyadenylation machinery: comprehensive analysis of protein-protein interactions and gene expression profiling</dc:title>

    <dc:creator>Arthur Hunt</dc:creator>
    <dc:creator>Ruqiang Xu</dc:creator>
    <dc:creator>Balasubrahmanyam Addepalli</dc:creator>
    <dc:creator>Suryadevara Rao</dc:creator>
    <dc:creator>Kevin Forbes</dc:creator>
    <dc:creator>Lisa Meeks</dc:creator>
    <dc:creator>Denghui Xing</dc:creator>
    <dc:creator>Min Mo</dc:creator>
    <dc:creator>Hongwei Zhao</dc:creator>
    <dc:creator>Amrita Bandyopadhyay</dc:creator>
    <dc:creator>Lavanya Dampanaboina</dc:creator>
    <dc:creator>Amanda Marion</dc:creator>
    <dc:creator>Carol Von Lanken</dc:creator>
    <dc:creator>Qingshun Li</dc:creator>
    <dc:identifier>doi:10.1186/1471-2164-9-220</dc:identifier>
    <dc:source>BMC Genomics, Vol. 9, No. 1. (2008)</dc:source>
    <dc:date>2008-05-15T01:18:18-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>BMC Genomics</prism:publicationName>
    <prism:volume>9</prism:volume>
    <prism:number>1</prism:number>
    <prism:category>arabidopsis</prism:category>
    <prism:category>transcription</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2800442">
    <title>U12 intron positions are more strongly conserved between animals and plants than U2 intron positions</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2800442</link>
    <description>&lt;i&gt;Biology Direct, Vol. 3, No. 1. (2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We report that the positions of minor, U12 introns are conserved in orthologous genes from human and Arabidopsis to an even greater extent than the positions of the major, U2 introns. The U12 introns, especially, conserved ones are concentrated in 5'-portions of plant and animal genes, where the U12 to U2 conversions occurs preferentially in the 3'-portions of genes. These results are compatible with the hypothesis that the high level of conservation of U12 intron positions and their persistence in genomes despite the unidirectional U12 to U2 conversion are explained by the role of the slowly excised U12 introns in down-regulation of gene expression. Reviewers: This article was reviewed by John Logsdon and Manyuan Long. For the full reviews, please go to the Reviewers' Reports section.</description>
    <dc:title>U12 intron positions are more strongly conserved between animals and plants than U2 intron positions</dc:title>

    <dc:creator>Malay Basu</dc:creator>
    <dc:creator>Wojciech Makalowski</dc:creator>
    <dc:creator>Igor Rogozin</dc:creator>
    <dc:creator>Eugene Koonin</dc:creator>
    <dc:identifier>doi:10.1186/1745-6150-3-19</dc:identifier>
    <dc:source>Biology Direct, Vol. 3, No. 1. (2008)</dc:source>
    <dc:date>2008-05-15T01:16:52-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Biology Direct</prism:publicationName>
    <prism:volume>3</prism:volume>
    <prism:number>1</prism:number>
    <prism:category>molecular_evolution</prism:category>
    <prism:category>transcription</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2798076">
    <title>CpG island density and its correlations with genomic features in mammalian genomes</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2798076</link>
    <description>&lt;i&gt;Genome Biology, Vol. 9 (13 May 2008), R79.&lt;/i&gt;</description>
    <dc:title>CpG island density and its correlations with genomic features in mammalian genomes</dc:title>

    <dc:creator>Leng Han</dc:creator>
    <dc:creator>Bing Su</dc:creator>
    <dc:creator>Wen-Hsiung Li</dc:creator>
    <dc:creator>Zhongming Zhao</dc:creator>
    <dc:identifier>doi:10.1186/gb-2008-9-5-r79</dc:identifier>
    <dc:source>Genome Biology, Vol. 9 (13 May 2008), R79.</dc:source>
    <dc:date>2008-05-14T12:22:14-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Genome Biology</prism:publicationName>
    <prism:issn>1465-6906</prism:issn>
    <prism:volume>9</prism:volume>
    <prism:startingPage>R79</prism:startingPage>
    <prism:category>genomics_analysis</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2800428">
    <title>Physiology and metabolism 'Tear down this wall'</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2800428</link>
    <description>&lt;i&gt;Current opinion in plant biology (7 May 2008)&lt;/i&gt;</description>
    <dc:title>Physiology and metabolism 'Tear down this wall'</dc:title>

    <dc:creator>Markus Pauly</dc:creator>
    <dc:creator>Kenneth Keegstra</dc:creator>
    <dc:identifier>doi:10.1016/j.pbi.2008.04.002</dc:identifier>
    <dc:source>Current opinion in plant biology (7 May 2008)</dc:source>
    <dc:date>2008-05-15T01:06:34-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Current opinion in plant biology</prism:publicationName>
    <prism:issn>1369-5266</prism:issn>
    <prism:category>plants</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2800212">
    <title>Regulatory change in YABBY-like transcription factor led to evolution of extreme fruit size during tomato domestication.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2800212</link>
    <description>&lt;i&gt;Nature genetics (11 May 2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Plant domestication represents an accelerated form of evolution, resulting in exaggerated changes in the tissues and organs of greatest interest to humans (for example, seeds, roots and tubers). One of the most extreme cases has been the evolution of tomato fruit. Cultivated tomato plants produce fruit as much as 1,000 times larger than those of their wild progenitors. Quantitative trait mapping studies have shown that a relatively small number of genes were involved in this dramatic transition, and these genes control two processes: cell cycle and organ number determination. The key gene in the first process has been isolated and corresponds to fw2.2, a negative regulator of cell division. However, until now, nothing was known about the molecular basis of the second process. Here, we show that the second major step in the evolution of extreme fruit size was the result of a regulatory change of a YABBY-like transcription factor (fasciated) that controls carpel number during flower and/or fruit development.</description>
    <dc:title>Regulatory change in YABBY-like transcription factor led to evolution of extreme fruit size during tomato domestication.</dc:title>

    <dc:creator>Bin Cong</dc:creator>
    <dc:creator>Luz S Barrero</dc:creator>
    <dc:creator>Steven D Tanksley</dc:creator>
    <dc:identifier>doi:10.1038/ng.144</dc:identifier>
    <dc:source>Nature genetics (11 May 2008)</dc:source>
    <dc:date>2008-05-14T22:50:24-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Nature genetics</prism:publicationName>
    <prism:issn>1546-1718</prism:issn>
    <prism:category>molecular_evolution</prism:category>
    <prism:category>plants</prism:category>
    <prism:category>transcription</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2800422">
    <title>Pre-mRNA splicing: a complex picture in higher definition.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2800422</link>
    <description>&lt;i&gt;Trends in biochemical sciences (8 May 2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Intron excision from pre-mRNAs of higher eukaryotes requires a transition from splice-site recognition across short exons to organization of the spliceosome across long introns. Recently, insight into this transition has been provided and, in addition, it has been shown that an alternative splicing factor, the polypyrimidine-tract-binding protein, can exert its control on splice-site choice by blocking this key step in the assembly of the splicing machinery.</description>
    <dc:title>Pre-mRNA splicing: a complex picture in higher definition.</dc:title>

    <dc:creator>Matthew J Schellenberg</dc:creator>
    <dc:creator>Dustin B Ritchie</dc:creator>
    <dc:creator>Andrew M Macmillan</dc:creator>
    <dc:identifier>doi:10.1016/j.tibs.2008.04.004</dc:identifier>
    <dc:source>Trends in biochemical sciences (8 May 2008)</dc:source>
    <dc:date>2008-05-15T01:02:17-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Trends in biochemical sciences</prism:publicationName>
    <prism:issn>0968-0004</prism:issn>
    <prism:category>transcription</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2800420">
    <title>Structural evolution of multisubunit RNA polymerases.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2800420</link>
    <description>&lt;i&gt;Trends in microbiology (9 May 2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Evolutionarily related multisubunit RNA polymerases (RNAPs) facilitate gene transcription throughout the three domains of life. During the past seven years an increasing number of bacterial and eukaryotic RNAP structures have been solved; however, the archaeal enzyme remained elusive. Two reports from the Murakami and Cramer laboratories have now filled this gap in our knowledge and enable us to hypothesize about the evolution of the structure and function of RNAPs.</description>
    <dc:title>Structural evolution of multisubunit RNA polymerases.</dc:title>

    <dc:creator>Finn Werner</dc:creator>
    <dc:identifier>doi:10.1016/j.tim.2008.03.008</dc:identifier>
    <dc:source>Trends in microbiology (9 May 2008)</dc:source>
    <dc:date>2008-05-15T01:01:44-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Trends in microbiology</prism:publicationName>
    <prism:issn>0966-842X</prism:issn>
    <prism:category>molecular_evolution</prism:category>
    <prism:category>transcription</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2800418">
    <title>Molecular evolution of the RNA polymerase II CTD.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2800418</link>
    <description>&lt;i&gt;Trends in genetics : TIG (8 May 2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;In higher eukaryotes, an unusual C-terminal domain (CTD) is crucial to the function of RNA polymerase II in transcription. The CTD consists of multiple heptapeptide repeats; differences in the number of repeats between organisms and their degree of conservation have intrigued researchers for two decades. Here, we review the evolution of the CTD at the molecular level. Several primitive motifs have been integrated into compound heptads that can be readily amplified. The selection of phosphorylatable residues in the heptad repeat provided the opportunity for advanced gene regulation in eukaryotes. Current findings suggest that the CTD should be considered as a collection of continuous overlapping motifs as opposed to a specific functional unit defined by a heptad.</description>
    <dc:title>Molecular evolution of the RNA polymerase II CTD.</dc:title>

    <dc:creator>Rob D Chapman</dc:creator>
    <dc:creator>Martin Heidemann</dc:creator>
    <dc:creator>Corinna Hintermair</dc:creator>
    <dc:creator>Dirk Eick</dc:creator>
    <dc:identifier>doi:10.1016/j.tig.2008.03.010</dc:identifier>
    <dc:source>Trends in genetics : TIG (8 May 2008)</dc:source>
    <dc:date>2008-05-15T01:01:02-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Trends in genetics : TIG</prism:publicationName>
    <prism:issn>0168-9525</prism:issn>
    <prism:category>molecular_evolution</prism:category>
    <prism:category>transcription</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2800415">
    <title>Circadian clock function in Arabidopsis thaliana: time beyond transcription.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2800415</link>
    <description>&lt;i&gt;Trends in cell biology (7 May 2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;The past decade has seen a remarkable advance in our understanding of the plant circadian system, mostly in Arabidopsis thaliana. It is now well established that Arabidopsis clock genes and their protein products operate through autoregulatory feedback loops that promote rhythmic oscillations in cellular, metabolic and physiological activities. This article reviews recent studies that have provided evidence for new mechanisms of clock organization and function. These mechanisms include protein-protein interactions and the regulation of protein stability, which, together, directly connect light signalling to the Arabidopsis circadian system. Evidence of rhythmic changes in chromatin structure has also opened new and exciting ways for regulation of clock gene expression. All of these mechanisms ensure an appropriate synchronization with the environment, which is crucial for successful plant growth and development.</description>
    <dc:title>Circadian clock function in Arabidopsis thaliana: time beyond transcription.</dc:title>

    <dc:creator>Paloma Más</dc:creator>
    <dc:identifier>doi:10.1016/j.tcb.2008.03.005</dc:identifier>
    <dc:source>Trends in cell biology (7 May 2008)</dc:source>
    <dc:date>2008-05-15T00:59:08-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Trends in cell biology</prism:publicationName>
    <prism:issn>0962-8924</prism:issn>
    <prism:category>arabidopsis</prism:category>
    <prism:category>plants</prism:category>
    <prism:category>transcription</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2784636">
    <title>Measuring global credibility with application to local sequence alignment.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2784636</link>
    <description>&lt;i&gt;PLoS computational biology, Vol. 4, No. 5. (May 2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Computational biology is replete with high-dimensional (high-D) discrete prediction and inference problems, including sequence alignment, RNA structure prediction, phylogenetic inference, motif finding, prediction of pathways, and model selection problems in statistical genetics. Even though prediction and inference in these settings are uncertain, little attention has been focused on the development of global measures of uncertainty. Regardless of the procedure employed to produce a prediction, when a procedure delivers a single answer, that answer is a point estimate selected from the solution ensemble, the set of all possible solutions. For high-D discrete space, these ensembles are immense, and thus there is considerable uncertainty. We recommend the use of Bayesian credibility limits to describe this uncertainty, where a (1-alpha)%, 0&#60;/=alpha&#60;/=1, credibility limit is the minimum Hamming distance radius of a hyper-sphere containing (1-alpha)% of the posterior distribution. Because sequence alignment is arguably the most extensively used procedure in computational biology, we employ it here to make these general concepts more concrete. The maximum similarity estimator (i.e., the alignment that maximizes the likelihood) and the centroid estimator (i.e., the alignment that minimizes the mean Hamming distance from the posterior weighted ensemble of alignments) are used to demonstrate the application of Bayesian credibility limits to alignment estimators. Application of Bayesian credibility limits to the alignment of 20 human/rodent orthologous sequence pairs and 125 orthologous sequence pairs from six Shewanella species shows that credibility limits of the alignments of promoter sequences of these species vary widely, and that centroid alignments dependably have tighter credibility limits than traditional maximum similarity alignments.</description>
    <dc:title>Measuring global credibility with application to local sequence alignment.</dc:title>

    <dc:creator>BJ Webb-Robertson</dc:creator>
    <dc:creator>LA McCue</dc:creator>
    <dc:creator>CE Lawrence</dc:creator>
    <dc:identifier>doi:10.1371/journal.pcbi.1000077</dc:identifier>
    <dc:source>PLoS computational biology, Vol. 4, No. 5. (May 2008)</dc:source>
    <dc:date>2008-05-11T16:25:06-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>PLoS computational biology</prism:publicationName>
    <prism:issn>1553-7358</prism:issn>
    <prism:volume>4</prism:volume>
    <prism:number>5</prism:number>
    <prism:category>alignment</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2784635">
    <title>Exploiting and integrating rich features for biological literature classification.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2784635</link>
    <description>&lt;i&gt;BMC bioinformatics, Vol. 9 Suppl 3 (2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND: Efficient features play an important role in automated text classification, which definitely facilitates the access of large-scale data. In the bioscience field, biological structures and terminologies are described by a large number of features; domain dependent features would significantly improve the classification performance. How to effectively select and integrate different types of features to improve the biological literature classification performance is the major issue studied in this paper. RESULTS: To efficiently classify the biological literatures, we propose a novel feature value schema TF*ML, features covering from lower level domain independent &#34;string feature&#34; to higher level domain dependent &#34;semantic template feature&#34;, and proper integrations among the features. Compared to our previous approaches, the performance is improved in terms of AUC and F-Score by 11.5% and 8.8% respectively, and outperforms the best performance achieved in BioCreAtIvE 2006. CONCLUSIONS: Different types of features possess different discriminative capabilities in literature classification; proper integration of domain independent and dependent features would significantly improve the performance and overcome the over-fitting on data distribution.</description>
    <dc:title>Exploiting and integrating rich features for biological literature classification.</dc:title>

    <dc:creator>H Wang</dc:creator>
    <dc:creator>M Huang</dc:creator>
    <dc:creator>S Ding</dc:creator>
    <dc:creator>X Zhu</dc:creator>
    <dc:identifier>doi:10.1186/1471-2105-9-S3-S4</dc:identifier>
    <dc:source>BMC bioinformatics, Vol. 9 Suppl 3 (2008)</dc:source>
    <dc:date>2008-05-11T16:24:44-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>BMC bioinformatics</prism:publicationName>
    <prism:issn>1471-2105</prism:issn>
    <prism:volume>9 Suppl 3</prism:volume>
    <prism:category>semantic_web</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2784634">
    <title>Identification of transcription factor contexts in literature using machine learning approaches.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2784634</link>
    <description>&lt;i&gt;BMC bioinformatics, Vol. 9 Suppl 3 (2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND: Availability of information about transcription factors (TFs) is crucial for genome biology, as TFs play a central role in the regulation of gene expression. While manual literature curation is expensive and labour intensive, the development of semi-automated text mining support is hindered by unavailability of training data. There have been no studies on how existing data sources (e.g. TF-related data from the MeSH thesaurus and GO ontology) or potentially noisy example data (e.g. protein-protein interaction, PPI) could be used to provide training data for identification of TF-contexts in literature. RESULTS: In this paper we describe a text-classification system designed to automatically recognise contexts related to transcription factors in literature. A learning model is based on a set of biological features (e.g. protein and gene names, interaction words, other biological terms) that are deemed relevant for the task. We have exploited background knowledge from existing biological resources (MeSH and GO) to engineer such features. Weak and noisy training datasets have been collected from descriptions of TF-related concepts in MeSH and GO, PPI data and data representing non-protein-function descriptions. Three machine-learning methods are investigated, along with a vote-based merging of individual approaches and/or different training datasets. The system achieved highly encouraging results, with most classifiers achieving an F-measure above 90%. CONCLUSIONS: The experimental results have shown that the proposed model can be used for identification of TF-related contexts (i.e. sentences) with high accuracy, with a significantly reduced set of features when compared to traditional bag-of-words approach. The results of considering existing PPI data suggest that there is not as high similarity between TF and PPI contexts as we have expected. We have also shown that existing knowledge sources are useful both for feature engineering and for obtaining noisy positive training data.</description>
    <dc:title>Identification of transcription factor contexts in literature using machine learning approaches.</dc:title>

    <dc:creator>H Yang</dc:creator>
    <dc:creator>G Nenadic</dc:creator>
    <dc:creator>JA Keane</dc:creator>
    <dc:identifier>doi:10.1186/1471-2105-9-S3-S11</dc:identifier>
    <dc:source>BMC bioinformatics, Vol. 9 Suppl 3 (2008)</dc:source>
    <dc:date>2008-05-11T16:24:32-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>BMC bioinformatics</prism:publicationName>
    <prism:issn>1471-2105</prism:issn>
    <prism:volume>9 Suppl 3</prism:volume>
    <prism:category>semantic_web</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2784632">
    <title>New challenges for text mining: mapping between text and manually curated pathways.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2784632</link>
    <description>&lt;i&gt;BMC bioinformatics, Vol. 9 Suppl 3 (2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND: Associating literature with pathways poses new challenges to the Text Mining (TM) community. There are three main challenges to this task: (1) the identification of the mapping position of a specific entity or reaction in a given pathway, (2) the recognition of the causal relationships among multiple reactions, and (3) the formulation and implementation of required inferences based on biological domain knowledge. RESULTS: To address these challenges, we constructed new resources to link the text with a model pathway; they are: the GENIA pathway corpus with event annotation and NF-kB pathway. Through their detailed analysis, we address the untapped resource, 'bio-inference,' as well as the differences between text and pathway representation. Here, we show the precise comparisons of their representations and the nine classes of 'bio-inference' schemes observed in the pathway corpus. CONCLUSIONS: We believe that the creation of such rich resources and their detailed analysis is the significant first step for accelerating the research of the automatic construction of pathway from text.</description>
    <dc:title>New challenges for text mining: mapping between text and manually curated pathways.</dc:title>

    <dc:creator>K Oda</dc:creator>
    <dc:creator>JD Kim</dc:creator>
    <dc:creator>T Ohta</dc:creator>
    <dc:creator>D Okanohara</dc:creator>
    <dc:creator>T Matsuzaki</dc:creator>
    <dc:creator>Y Tateisi</dc:creator>
    <dc:creator>J Tsujii</dc:creator>
    <dc:identifier>doi:10.1186/1471-2105-9-S3-S5</dc:identifier>
    <dc:source>BMC bioinformatics, Vol. 9 Suppl 3 (2008)</dc:source>
    <dc:date>2008-05-11T16:24:10-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>BMC bioinformatics</prism:publicationName>
    <prism:issn>1471-2105</prism:issn>
    <prism:volume>9 Suppl 3</prism:volume>
    <prism:category>semantic_web</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2784631">
    <title>Gene Ontology density estimation and discourse analysis for automatic GeneRiF extraction.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2784631</link>
    <description>&lt;i&gt;BMC bioinformatics, Vol. 9 Suppl 3 (2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND: This paper describes and evaluates a sentence selection engine that extracts a GeneRiF (Gene Reference into Functions) as defined in ENTREZ-Gene based on a MEDLINE record. Inputs for this task include both a gene and a pointer to a MEDLINE reference. In the suggested approach we merge two independent sentence extraction strategies. The first proposed strategy (LASt) uses argumentative features, inspired by discourse-analysis models. The second extraction scheme (GOEx) uses an automatic text categorizer to estimate the density of Gene Ontology categories in every sentence; thus providing a full ranking of all possible candidate GeneRiFs. A combination of the two approaches is proposed, which also aims at reducing the size of the selected segment by filtering out non-content bearing rhetorical phrases. RESULTS: Based on the TREC-2003 Genomics collection for GeneRiF identification, the LASt extraction strategy is already competitive (52.78%). When used in a combined approach, the extraction task clearly shows improvement, achieving a Dice score of over 57% (+10%). CONCLUSIONS: Argumentative representation levels and conceptual density estimation using Gene Ontology contents appear complementary for functional annotation in proteomics.</description>
    <dc:title>Gene Ontology density estimation and discourse analysis for automatic GeneRiF extraction.</dc:title>

    <dc:creator>J Gobeill</dc:creator>
    <dc:creator>I Tbahriti</dc:creator>
    <dc:creator>F Ehrler</dc:creator>
    <dc:creator>A Mottaz</dc:creator>
    <dc:creator>AL Veuthey</dc:creator>
    <dc:creator>P Ruch</dc:creator>
    <dc:identifier>doi:10.1186/1471-2105-9-S3-S9</dc:identifier>
    <dc:source>BMC bioinformatics, Vol. 9 Suppl 3 (2008)</dc:source>
    <dc:date>2008-05-11T16:23:57-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>BMC bioinformatics</prism:publicationName>
    <prism:issn>1471-2105</prism:issn>
    <prism:volume>9 Suppl 3</prism:volume>
    <prism:category>semantic_web</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2784627">
    <title>RDFScape: Semantic Web meets systems biology.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2784627</link>
    <description>&lt;i&gt;BMC bioinformatics, Vol. 9 Suppl 4 (2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND: The recent availability of high-throughput data in molecular biology has increased the need for a formal representation of this knowledge domain. New ontologies are being developed to formalize knowledge, e.g. about the functions of proteins. As the Semantic Web is being introduced into the Life Sciences, the basis for a distributed knowledge-base that can foster biological data analysis is laid. However, there still is a dichotomy, in tools and methodologies, between the use of ontologies in biological investigation, that is, in relation to experimental observations, and their use as a knowledge-base. RESULTS: RDFScape is a plugin that has been developed to extend a software oriented to biological analysis with support for reasoning on ontologies in the semantic web framework. We show with this plugin how the use of ontological knowledge in biological analysis can be extended through the use of inference. In particular, we present two examples relative to ontologies representing biological pathways: we demonstrate how these can be abstracted and visualized as interaction networks, and how reasoning on causal dependencies within elements of pathways can be implemented. CONCLUSIONS: The use of ontologies for the interpretation of high-throughput biological data can be improved through the use of inference. This allows the use of ontologies not only as annotations, but as a knowledge-base from which new information relevant for specific analysis can be derived.</description>
    <dc:title>RDFScape: Semantic Web meets systems biology.</dc:title>

    <dc:creator>A Splendiani</dc:creator>
    <dc:identifier>doi:10.1186/1471-2105-9-S4-S6</dc:identifier>
    <dc:source>BMC bioinformatics, Vol. 9 Suppl 4 (2008)</dc:source>
    <dc:date>2008-05-11T16:22:53-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>BMC bioinformatics</prism:publicationName>
    <prism:issn>1471-2105</prism:issn>
    <prism:volume>9 Suppl 4</prism:volume>
    <prism:category>semantic_web</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2782164">
    <title>Bioinformatic analyses of mammalian 5'-UTR sequence properties of mRNAs predicts alternative translation initiation sites</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2782164</link>
    <description>&lt;i&gt;BMC Bioinformatics, Vol. 9 (08 May 2008), 232.&lt;/i&gt;</description>
    <dc:title>Bioinformatic analyses of mammalian 5'-UTR sequence properties of mRNAs predicts alternative translation initiation sites</dc:title>

    <dc:creator>Jill Wegrzyn</dc:creator>
    <dc:creator>Thomas Drudge</dc:creator>
    <dc:creator>Faramarz Valafar</dc:creator>
    <dc:creator>Vivian Hook</dc:creator>
    <dc:identifier>doi:10.1186/1471-2105-9-232</dc:identifier>
    <dc:source>BMC Bioinformatics, Vol. 9 (08 May 2008), 232.</dc:source>
    <dc:date>2008-05-10T00:57:17-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>BMC Bioinformatics</prism:publicationName>
    <prism:issn>1471-2105</prism:issn>
    <prism:volume>9</prism:volume>
    <prism:startingPage>232</prism:startingPage>
    <prism:category>semantic_web</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2784625">
    <title>Metrics for GO based protein semantic similarity: a systematic evaluation.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2784625</link>
    <description>&lt;i&gt;BMC bioinformatics, Vol. 9 Suppl 5 (2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND: Several semantic similarity measures have been applied to gene products annotated with Gene Ontology terms, providing a basis for their functional comparison. However, it is still unclear which is the best approach to semantic similarity in this context, since there is no conclusive evaluation of the various measures. Another issue, is whether electronic annotations should or not be used in semantic similarity calculations. RESULTS: We conducted a systematic evaluation of GO-based semantic similarity measures using the relationship with sequence similarity as a means to quantify their performance, and assessed the influence of electronic annotations by testing the measures in the presence and absence of these annotations. We verified that the relationship between semantic and sequence similarity is not linear, but can be well approximated by a rescaled Normal cumulative distribution function. Given that the majority of the semantic similarity measures capture an identical behaviour, but differ in resolution, we used the latter as the main criterion of evaluation. CONCLUSIONS: This work has provided a basis for the comparison of several semantic similarity measures, and can aid researchers in choosing the most adequate measure for their work. We have found that the hybrid simGIC was the measure with the best overall performance, followed by Resnik's measure using a best-match average combination approach. We have also found that the average and maximum combination approaches are problematic since both are inherently influenced by the number of terms being combined. We suspect that there may be a direct influence of data circularity in the behaviour of the results including electronic annotations, as a result of functional inference from sequence similarity.</description>
    <dc:title>Metrics for GO based protein semantic similarity: a systematic evaluation.</dc:title>

    <dc:creator>C Pesquita</dc:creator>
    <dc:creator>D Faria</dc:creator>
    <dc:creator>H Bastos</dc:creator>
    <dc:creator>AE Ferreira</dc:creator>
    <dc:creator>AO Falcão</dc:creator>
    <dc:creator>FM Couto</dc:creator>
    <dc:identifier>doi:10.1186/1471-2105-9-S5-S4</dc:identifier>
    <dc:source>BMC bioinformatics, Vol. 9 Suppl 5 (2008)</dc:source>
    <dc:date>2008-05-11T16:22:05-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>BMC bioinformatics</prism:publicationName>
    <prism:issn>1471-2105</prism:issn>
    <prism:volume>9 Suppl 5</prism:volume>
    <prism:category>semantic_web</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2784624">
    <title>Gene Ontology annotations: what they mean and where they come from.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2784624</link>
    <description>&lt;i&gt;BMC bioinformatics, Vol. 9 Suppl 5 (2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;To address the challenges of information integration and retrieval, the computational genomics community increasingly has come to rely on the methodology of creating annotations of scientific literature using terms from controlled structured vocabularies such as the Gene Ontology (GO). Here we address the question of what such annotations signify and of how they are created by working biologists. Our goal is to promote a better understanding of how the results of experiments are captured in annotations, in the hope that this will lead both to better representations of biological reality through annotation and ontology development and to more informed use of GO resources by experimental scientists.</description>
    <dc:title>Gene Ontology annotations: what they mean and where they come from.</dc:title>

    <dc:creator>DP Hill</dc:creator>
    <dc:creator>B Smith</dc:creator>
    <dc:creator>MS McAndrews-Hill</dc:creator>
    <dc:creator>JA Blake</dc:creator>
    <dc:identifier>doi:10.1186/1471-2105-9-S5-S2</dc:identifier>
    <dc:source>BMC bioinformatics, Vol. 9 Suppl 5 (2008)</dc:source>
    <dc:date>2008-05-11T16:21:46-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>BMC bioinformatics</prism:publicationName>
    <prism:issn>1471-2105</prism:issn>
    <prism:volume>9 Suppl 5</prism:volume>
    <prism:category>semantic_web</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2738967">
    <title>Ontology-guided data preparation for discovering genotype-phenotype relationships</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2738967</link>
    <description>&lt;i&gt;BMC Bioinformatics, Vol. 9, No. Suppl 4. (2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND:Complexity and amount of post-genomic data constitute two major factors limiting the application of Knowledge Discovery in Databases (KDD) methods in life sciences. Bio-ontologies may nowadays play key roles in knowledge discovery in life science providing semantics to data and to extracted units, by taking advantage of the progress of Semantic Web technologies concerning the understanding and availability of tools for knowledge representation, extraction, and reasoning.RESULTS:This paper presents a method that exploits bio-ontologies for guiding data selection within the preparation step of the KDD process. We propose three scenarios in which domain knowledge and ontology elements such as subsumption, properties, class descriptions, are taken into account for data selection, before the data mining step. Each of these scenarios is illustrated within a case-study relative to the search of genotype-phenotype relationships in a familial hypercholesterolemia dataset. The guiding of data selection based on domain knowledge is analysed and shows a direct influence on the volume and significance of the data mining results.CONCLUSIONS:The method proposed in this paper is an efficient alternative to numerical methods for data selection based on domain knowledge. In turn, the results of this study may be reused in ontology modelling and data integration.</description>
    <dc:title>Ontology-guided data preparation for discovering genotype-phenotype relationships</dc:title>

    <dc:creator>Adrien Coulet</dc:creator>
    <dc:creator>Malika Tabbone</dc:creator>
    <dc:creator>Pascale Benlian</dc:creator>
    <dc:creator>Amedeo Napoli</dc:creator>
    <dc:creator>Marie Devignes</dc:creator>
    <dc:identifier>doi:10.1186/1471-2105-9-S4-S3</dc:identifier>
    <dc:source>BMC Bioinformatics, Vol. 9, No. Suppl 4. (2008)</dc:source>
    <dc:date>2008-04-30T15:14:25-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>BMC Bioinformatics</prism:publicationName>
    <prism:volume>9</prism:volume>
    <prism:number>Suppl 4</prism:number>
    <prism:category>semantic_web</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2784622">
    <title>Terminologies for text-mining; an experiment in the lipoprotein metabolism domain.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2784622</link>
    <description>&lt;i&gt;BMC bioinformatics, Vol. 9 Suppl 4 (2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND: The engineering of ontologies, especially with a view to a text-mining use, is still a new research field. There does not yet exist a well-defined theory and technology for ontology construction. Many of the ontology design steps remain manual and are based on personal experience and intuition. However, there exist a few efforts on automatic construction of ontologies in the form of extracted lists of terms and relations between them. RESULTS: We share experience acquired during the manual development of a lipoprotein metabolism ontology (LMO) to be used for text-mining. We compare the manually created ontology terms with the automatically derived terminology from four different automatic term recognition (ATR) methods. The top 50 predicted terms contain up to 89% relevant terms. For the top 1000 terms the best method still generates 51% relevant terms. In a corpus of 3066 documents 53% of LMO terms are contained and 38% can be generated with one of the methods. CONCLUSIONS: Given high precision, automatic methods can help decrease development time and provide significant support for the identification of domain-specific vocabulary. The coverage of the domain vocabulary depends strongly on the underlying documents. Ontology development for text mining should be performed in a semi-automatic way; taking ATR results as input and following the guidelines we described. AVAILABILITY: The TFIDF term recognition is available as Web Service, described at http://gopubmed4.biotec.tu-dresden.de/IdavollWebService/services/CandidateTermGeneratorService?wsdl.</description>
    <dc:title>Terminologies for text-mining; an experiment in the lipoprotein metabolism domain.</dc:title>

    <dc:creator>D Alexopoulou</dc:creator>
    <dc:creator>T Wächter</dc:creator>
    <dc:creator>L Pickersgill</dc:creator>
    <dc:creator>C Eyre</dc:creator>
    <dc:creator>M Schroeder</dc:creator>
    <dc:identifier>doi:10.1186/1471-2105-9-S4-S2</dc:identifier>
    <dc:source>BMC bioinformatics, Vol. 9 Suppl 4 (2008)</dc:source>
    <dc:date>2008-05-11T16:18:25-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>BMC bioinformatics</prism:publicationName>
    <prism:issn>1471-2105</prism:issn>
    <prism:volume>9 Suppl 4</prism:volume>
    <prism:category>semantic_web</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2784619">
    <title>A Semantic Web for bioinformatics: goals, tools, systems, applications.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2784619</link>
    <description>&lt;i&gt;BMC bioinformatics, Vol. 9 Suppl 4 (2008)&lt;/i&gt;</description>
    <dc:title>A Semantic Web for bioinformatics: goals, tools, systems, applications.</dc:title>

    <dc:creator>N Cannata</dc:creator>
    <dc:creator>M Schröder</dc:creator>
    <dc:creator>R Marangoni</dc:creator>
    <dc:creator>P Romano</dc:creator>
    <dc:identifier>doi:10.1186/1471-2105-9-S4-S1</dc:identifier>
    <dc:source>BMC bioinformatics, Vol. 9 Suppl 4 (2008)</dc:source>
    <dc:date>2008-05-11T16:16:58-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>BMC bioinformatics</prism:publicationName>
    <prism:issn>1471-2105</prism:issn>
    <prism:volume>9 Suppl 4</prism:volume>
    <prism:category>semantic_web</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2062092">
    <title>Novel motifs in amino acid permease genes from Leishmania</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2062092</link>
    <description>&lt;i&gt;Biochemical and Biophysical Research Communications, Vol. 325, No. 1. (3 December 2004), pp. 353-366.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Eight amino acid permease genes from the protozoan parasite Leishmania donovani (AAPLDs) were cloned, sequenced, and shown to be expressed in promastigotes. Seven of these belong to the amino acid transporter-1 and one to the amino acid polyamino-choline superfamilies. Using these sequences as well as known and characterized amino acid permease genes from all kingdoms, a training set was established and used to search for motifs, using the MEME motif discovery tool. This study revealed two motifs that are specific to the genus Leishmania, four to the family trypanosomatidae, and a single motif that is common between trypanosomatidae and mammalian systems A1 and N. Interestingly, most of these motifs are clustered in two regions of 50-60 amino acids. Blast search analyses indicated a close relationship between the L. donovani and Trypanosoma brucei amino acid permeases. The results of this work describe the cloning of the first amino acid permease genes in parasitic protozoa and contribute to the understanding of amino acid permease evolution in these organisms. Furthermore, the identification of genus-specific motifs in these proteins might be useful to better understand parasite physiology within its hosts.</description>
    <dc:title>Novel motifs in amino acid permease genes from Leishmania</dc:title>

    <dc:creator>Martin Akerman</dc:creator>
    <dc:creator>Pninit Shaked-Mishan</dc:creator>
    <dc:creator>Salam Mazareb</dc:creator>
    <dc:creator>Hanne Volpin</dc:creator>
    <dc:creator>Dan Zilberstein</dc:creator>
    <dc:identifier>doi:10.1016/j.bbrc.2004.09.212</dc:identifier>
    <dc:source>Biochemical and Biophysical Research Communications, Vol. 325, No. 1. (3 December 2004), pp. 353-366.</dc:source>
    <dc:date>2007-12-05T15:49:09-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:publicationName>Biochemical and Biophysical Research Communications</prism:publicationName>
    <prism:volume>325</prism:volume>
    <prism:number>1</prism:number>
    <prism:startingPage>353</prism:startingPage>
    <prism:endingPage>366</prism:endingPage>
    <prism:category>leishmaniasis</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/466068">
    <title>Transcriptional regulatory code of a eukaryotic genome</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/466068</link>
    <description>&lt;i&gt;Nature, Vol. 431, No. 7004. (2004), pp. 99-104.&lt;/i&gt;</description>
    <dc:title>Transcriptional regulatory code of a eukaryotic genome</dc:title>

    <dc:creator>Christopher Harbison</dc:creator>
    <dc:creator>Benjamin Gordon</dc:creator>
    <dc:creator>Tong Lee</dc:creator>
    <dc:creator>Nicola Rinaldi</dc:creator>
    <dc:creator>Kenzie Macisaac</dc:creator>
    <dc:creator>Timothy Danford</dc:creator>
    <dc:creator>Nancy Hannett</dc:creator>
    <dc:creator>Jean-Bosco Tagne</dc:creator>
    <dc:creator>David Reynolds</dc:creator>
    <dc:creator>Jane Yoo</dc:creator>
    <dc:creator>Ezra Jennings</dc:creator>
    <dc:creator>Julia Zeitlinger</dc:creator>
    <dc:creator>Dmitry Pokholok</dc:creator>
    <dc:creator>Manolis Kellis</dc:creator>
    <dc:creator>Alex Rolfe</dc:creator>
    <dc:creator>Ken Takusagawa</dc:creator>
    <dc:creator>Eric Lander</dc:creator>
    <dc:creator>David Gifford</dc:creator>
    <dc:creator>Ernest Fraenkel</dc:creator>
    <dc:creator>Richard Young</dc:creator>
    <dc:identifier>doi:10.1038/nature02800</dc:identifier>
    <dc:source>Nature, Vol. 431, No. 7004. (2004), pp. 99-104.</dc:source>
    <dc:date>2006-01-16T14:50:46-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:publicationName>Nature</prism:publicationName>
    <prism:volume>431</prism:volume>
    <prism:number>7004</prism:number>
    <prism:startingPage>99</prism:startingPage>
    <prism:endingPage>104</prism:endingPage>
    <prism:category>genetic_regulation</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/456205">
    <title>DBD: a transcription factor prediction database.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/456205</link>
    <description>&lt;i&gt;Nucleic Acids Res, Vol. 34, No. Database issue. (1 January 2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Regulation of gene expression influences almost all biological processes in an organism; sequence-specific DNA-binding transcription factors are critical to this control. For most genomes, the repertoire of transcription factors is only partially known. Hitherto transcription factor identification has been largely based on genome annotation pipelines that use pairwise sequence comparisons, which detect only those factors similar to known genes, or on functional classification schemes that amalgamate many types of proteins into the category of 'transcription factor'. Using a novel transcription factor identification method, the DBD transcription factor database fills this void, providing genome-wide transcription factor predictions for organisms from across the tree of life. The prediction method behind DBD identifies sequence-specific DNA-binding transcription factors through homology using profile hidden Markov models (HMMs) of domains. Thus, it is limited to factors that are homologus to those HMMs. The collection of HMMs is taken from two existing databases (Pfam and SUPERFAMILY), and is limited to models that exclusively detect transcription factors that specifically recognize DNA sequences. It does not include basal transcription factors or chromatin-associated proteins, for instance. Based on comparison with experimentally verified annotation, the prediction procedure is between 95% and 99% accurate. Between one quarter and one-half of our genome-wide predicted transcription factors represent previously uncharacterized proteins. The DBD (www.transcriptionfactor.org) consists of predicted transcription factor repertoires for 150 completely sequenced genomes, their domain assignments and the hand curated list of DNA-binding domain HMMs. Users can browse, search or download the predictions by genome, domain family or sequence identifier, view families of transcription factors based on domain architecture and receive predictions for a protein sequence.</description>
    <dc:title>DBD: a transcription factor prediction database.</dc:title>

    <dc:creator>SK Kummerfeld</dc:creator>
    <dc:creator>SA Teichmann</dc:creator>
    <dc:source>Nucleic Acids Res, Vol. 34, No. Database issue. (1 January 2006)</dc:source>
    <dc:date>2006-01-05T12:53:50-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Nucleic Acids Res</prism:publicationName>
    <prism:issn>1362-4962</prism:issn>
    <prism:volume>34</prism:volume>
    <prism:number>Database issue</prism:number>
    <prism:category>database</prism:category>
    <prism:category>genetic_regulation</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/106364">
    <title>Systematic discovery of regulatory motifs in human promoters and 3[prime] UTRs by comparison of several mammals</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/106364</link>
    <description>&lt;i&gt;Nature, Vol. aop, No. current. (27 February 2005)&lt;/i&gt;</description>
    <dc:title>Systematic discovery of regulatory motifs in human promoters and 3[prime] UTRs by comparison of several mammals</dc:title>

    <dc:creator>Xiaohui Xie</dc:creator>
    <dc:creator>Jun Lu</dc:creator>
    <dc:creator>EJ Kulbokas</dc:creator>
    <dc:creator>Todd Golub</dc:creator>
    <dc:creator>Vamsi Mootha</dc:creator>
    <dc:creator>Kerstin Lindblad-Toh</dc:creator>
    <dc:creator>Eric Lander</dc:creator>
    <dc:creator>Manolis Kellis</dc:creator>
    <dc:identifier>doi:10.1038/nature03441</dc:identifier>
    <dc:source>Nature, Vol. aop, No. current. (27 February 2005)</dc:source>
    <dc:date>2005-02-28T05:59:22-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Nature</prism:publicationName>
    <prism:issn>0028-0836</prism:issn>
    <prism:volume>aop</prism:volume>
    <prism:number>current</prism:number>
    <prism:publisher>Nature Publishing Group</prism:publisher>
    <prism:category>genetic_regulation</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/711440">
    <title>An ORFeome-based analysis of human transcription factor genes and the construction of a microarray to interrogate their expression.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/711440</link>
    <description>&lt;i&gt;Genome Res, Vol. 14, No. 10B. (October 2004), pp. 2041-2047.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Transcription factors (TFs) are essential regulators of gene expression, and mutated TF genes have been shown to cause numerous human genetic diseases. Yet to date, no single, comprehensive database of human TFs exists. In this work, we describe the collection of an essentially complete set of TF genes from one depiction of the human ORFeome, and the design of a microarray to interrogate their expression. Taking 1468 known TFs from TRANSFAC, InterPro, and FlyBase, we used this seed set to search the ScriptSure human transcriptome database for additional genes. ScriptSure's genome-anchored transcript clusters allowed us to work with a nonredundant high-quality representation of the human transcriptome. We used a high-stringency similarity search by using BLASTN, and a protein motif search of the human ORFeome by using hidden Markov models of DNA-binding domains known to occur exclusively or primarily in TFs. Four hundred ninety-four additional TF genes were identified in the overlap between the two searches, bringing our estimate of the total number of human TFs to 1962. Zinc finger genes are by far the most abundant family (762 members), followed by homeobox (199 members) and basic helix-loop-helix genes (117 members). We designed a microarray of 50-mer oligonucleotide probes targeted to a unique region of the coding sequence of each gene. We have successfully used this microarray to interrogate TF gene expression in species as diverse as chickens and mice, as well as in humans.</description>
    <dc:title>An ORFeome-based analysis of human transcription factor genes and the construction of a microarray to interrogate their expression.</dc:title>

    <dc:creator>DN Messina</dc:creator>
    <dc:creator>J Glasscock</dc:creator>
    <dc:creator>W Gish</dc:creator>
    <dc:creator>M Lovett</dc:creator>
    <dc:identifier>doi:10.1101/gr.2584104</dc:identifier>
    <dc:source>Genome Res, Vol. 14, No. 10B. (October 2004), pp. 2041-2047.</dc:source>
    <dc:date>2006-06-26T15:41:16-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:publicationName>Genome Res</prism:publicationName>
    <prism:issn>1088-9051</prism:issn>
    <prism:volume>14</prism:volume>
    <prism:number>10B</prism:number>
    <prism:startingPage>2041</prism:startingPage>
    <prism:endingPage>2047</prism:endingPage>
    <prism:category>genetic_regulation</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/483014">
    <title>Defining transcriptional networks through integrative modeling of mRNA expression and transcription factor binding data.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/483014</link>
    <description>&lt;i&gt;BMC Bioinformatics, Vol. 5 (18 March 2004)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND: Functional genomics studies are yielding information about regulatory processes in the cell at an unprecedented scale. In the yeast S. cerevisiae, DNA microarrays have not only been used to measure the mRNA abundance for all genes under a variety of conditions but also to determine the occupancy of all promoter regions by a large number of transcription factors. The challenge is to extract useful information about the global regulatory network from these data. RESULTS: We present MA-Networker, an algorithm that combines microarray data for mRNA expression and transcription factor occupancy to define the regulatory network of the cell. Multivariate regression analysis is used to infer the activity of each transcription factor, and the correlation across different conditions between this activity and the mRNA expression of a gene is interpreted as regulatory coupling strength. Applying our method to S. cerevisiae, we find that, on average, 58% of the genes whose promoter region is bound by a transcription factor are true regulatory targets. These results are validated by an analysis of enrichment for functional annotation, response for transcription factor deletion, and over-representation of cis-regulatory motifs. We are able to assign directionality to transcription factors that control divergently transcribed genes sharing the same promoter region. Finally, we identify an intrinsic limitation of transcription factor deletion experiments related to the combinatorial nature of transcriptional control, to which our approach provides an alternative. CONCLUSION: Our reliable classification of ChIP positives into functional and non-functional TF targets based on their expression pattern across a wide range of conditions provides a starting point for identifying the unknown sequence features in non-coding DNA that directly or indirectly determine the context dependence of transcription factor action. Complete analysis results are available for browsing or download at http://bussemaker.bio.columbia.edu/papers/MA-Networker/.</description>
    <dc:title>Defining transcriptional networks through integrative modeling of mRNA expression and transcription factor binding data.</dc:title>

    <dc:creator>F Gao</dc:creator>
    <dc:creator>BC Foat</dc:creator>
    <dc:creator>HJ Bussemaker</dc:creator>
    <dc:identifier>doi:10.1186/1471-2105-5-31</dc:identifier>
    <dc:source>BMC Bioinformatics, Vol. 5 (18 March 2004)</dc:source>
    <dc:date>2006-01-27T18:07:26-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:publicationName>BMC Bioinformatics</prism:publicationName>
    <prism:issn>1471-2105</prism:issn>
    <prism:volume>5</prism:volume>
    <prism:category>genetic_regulation</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/717214">
    <title>Integrated assessment and prediction of transcription factor binding.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/717214</link>
    <description>&lt;i&gt;PLoS Comput Biol, Vol. 2, No. 6. (16 June 2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Systematic chromatin immunoprecipitation (chIP-chip) experiments have become a central technique for mapping transcriptional interactions in model organisms and humans. However, measurement of chromatin binding does not necessarily imply regulation, and binding may be difficult to detect if it is condition or cofactor dependent. To address these challenges, we present an approach for reliably assigning transcription factors (TFs) to target genes that integrates many lines of direct and indirect evidence into a single probabilistic model. Using this approach, we analyze publicly available chIP-chip binding profiles measured for yeast TFs in standard conditions, showing that our model interprets these data with significantly higher accuracy than previous methods. Pooling the high-confidence interactions reveals a large network containing 363 significant sets of factors (TF modules) that cooperate to regulate common target genes. In addition, the method predicts 980 novel binding interactions with high confidence that are likely to occur in so-far untested conditions. Indeed, using new chIP-chip experiments we show that predicted interactions for the factors Rpn4p and Pdr1p are observed only after treatment of cells with methyl-methanesulfonate, a DNA-damaging agent. We outline the first approach for consistently integrating all available evidences for TF-target interactions and we comprehensively identify the resulting TF module hierarchy. Prioritizing experimental conditions for each factor will be especially important as increasing numbers of chIP-chip assays are performed in complex organisms such as humans, for which &#34;standard conditions&#34; are ill defined.</description>
    <dc:title>Integrated assessment and prediction of transcription factor binding.</dc:title>

    <dc:creator>A Beyer</dc:creator>
    <dc:creator>C Workman</dc:creator>
    <dc:creator>J Hollunder</dc:creator>
    <dc:creator>D Radke</dc:creator>
    <dc:creator>U Möller</dc:creator>
    <dc:creator>T Wilhelm</dc:creator>
    <dc:creator>T Ideker</dc:creator>
    <dc:identifier>doi:10.1371/journal.pcbi.0020070</dc:identifier>
    <dc:source>PLoS Comput Biol, Vol. 2, No. 6. (16 June 2006)</dc:source>
    <dc:date>2006-06-30T09:45:02-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>PLoS Comput Biol</prism:publicationName>
    <prism:issn>1553-7358</prism:issn>
    <prism:volume>2</prism:volume>
    <prism:number>6</prism:number>
    <prism:category>genetic_regulation</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/715688">
    <title>REDUCE: An online tool for inferring cis-regulatory elements and transcriptional module activities from microarray data.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/715688</link>
    <description>&lt;i&gt;Nucleic Acids Res, Vol. 31, No. 13. (1 July 2003), pp. 3487-3490.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;REDUCE is a motif-based regression method for microarray analysis. The only required inputs are (i) a single genome-wide set of absolute or relative mRNA abundances and (ii) the DNA sequence of the regulatory region associated with each gene that is probed. Currently supported organisms are yeast, worm and fly; it is an open question whether in its current incarnation our approach can be used for mouse or human. REDUCE uses unbiased statistics to identify oligonucleotide motifs whose occurrence in the regulatory region of a gene correlates with the level of mRNA expression. Regression analysis is used to infer the activity of the transcriptional module associated with each motif. REDUCE is available online at http://bussemaker.bio.columbia.edu/reduce/. This web site provides functionality for the upload and management of microarray data. REDUCE analysis results can be viewed and downloaded, and optionally be shared with other users or made publicly accessible.</description>
    <dc:title>REDUCE: An online tool for inferring cis-regulatory elements and transcriptional module activities from microarray data.</dc:title>

    <dc:creator>C Roven</dc:creator>
    <dc:creator>HJ Bussemaker</dc:creator>
    <dc:identifier>doi:10.1093/nar/gkg630</dc:identifier>
    <dc:source>Nucleic Acids Res, Vol. 31, No. 13. (1 July 2003), pp. 3487-3490.</dc:source>
    <dc:date>2006-06-29T13:53:41-00:00</dc:date>
    <prism:publicationYear>2003</prism:publicationYear>
    <prism:publicationName>Nucleic Acids Res</prism:publicationName>
    <prism:issn>1362-4962</prism:issn>
    <prism:volume>31</prism:volume>
    <prism:number>13</prism:number>
    <prism:startingPage>3487</prism:startingPage>
    <prism:endingPage>3490</prism:endingPage>
    <prism:category>genetic_regulation</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/698675">
    <title>Close sequence comparisons are sufficient to identify human cis-regulatory elements.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/698675</link>
    <description>&lt;i&gt;Genome Res (12 June 2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Cross-species DNA sequence comparison is the primary method used to identify functional noncoding elements in human and other large genomes. However, little is known about the relative merits of evolutionarily close and distant sequence comparisons. To address this problem, we identified evolutionarily conserved noncoding regions in primate, mammalian, and more distant comparisons using a uniform approach (Gumby) that facilitates unbiased assessment of the impact of evolutionary distance on predictive power. We benchmarked computational predictions against previously identified cis-regulatory elements at diverse genomic loci and also tested numerous extremely conserved human-rodent sequences for transcriptional enhancer activity using an in vivo enhancer assay in transgenic mice. Human regulatory elements were identified with acceptable sensitivity (53%-80%) and true-positive rate (27%-67%) by comparison with one to five other eutherian mammals or six other simian primates. More distant comparisons (marsupial, avian, amphibian, and fish) failed to identify many of the empirically defined functional noncoding elements. Our results highlight the practical utility of close sequence comparisons, and the loss of sensitivity entailed by more distant comparisons. We derived an intuitive relationship between ancient and recent noncoding sequence conservation from whole-genome comparative analysis that explains most of the observations from empirical benchmarking. Lastly, we determined that, in addition to strength of conservation, genomic location and/or density of surrounding conserved elements must also be considered in selecting candidate enhancers for in vivo testing at embryonic time points.</description>
    <dc:title>Close sequence comparisons are sufficient to identify human cis-regulatory elements.</dc:title>

    <dc:creator>Shyam Prabhakar</dc:creator>
    <dc:creator>Francis Poulin</dc:creator>
    <dc:creator>Malak Shoukry</dc:creator>
    <dc:creator>Veena Afzal</dc:creator>
    <dc:creator>Edward M Rubin</dc:creator>
    <dc:creator>Olivier Couronne</dc:creator>
    <dc:creator>Len A Pennacchio</dc:creator>
    <dc:identifier>doi:10.1101/gr.4717506</dc:identifier>
    <dc:source>Genome Res (12 June 2006)</dc:source>
    <dc:date>2006-06-16T19:46:25-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Genome Res</prism:publicationName>
    <prism:issn>1088-9051</prism:issn>
    <prism:category>genetic_regulation</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/771643">
    <title>Functional analysis of human and chimpanzee promoters.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/771643</link>
    <description>&lt;i&gt;Genome Biol, Vol. 6, No. 7. (2005)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND: It has long been argued that changes in gene expression may provide an additional and crucial perspective on the evolutionary differences between humans and chimpanzees. To investigate how often expression differences seen in tissues are caused by sequence differences in the proximal promoters, we tested the expression activity in cultured cells of human and chimpanzee promoters from genes that differ in mRNA expression between human and chimpanzee tissues. RESULTS: Twelve promoters for which the corresponding gene had been shown to be differentially expressed between humans and chimpanzees in liver or brain were tested. Seven showed a significant difference in activity between the human promoter and the orthologous chimpanzee promoter in at least one of the two cell lines used. However, only three of them showed a difference in the same direction as in the tissues. CONCLUSION: Differences in proximal promoter activity are likely to be common between humans and chimpanzees, but are not linked in a simple fashion to gene-expression levels in tissues. This suggests that several genetic differences between humans and chimpanzees might be responsible for a single expression difference and thus that relevant expression differences between humans and chimpanzees will be difficult to predict from cell culture experiments or DNA sequences.</description>
    <dc:title>Functional analysis of human and chimpanzee promoters.</dc:title>

    <dc:creator>F Heissig</dc:creator>
    <dc:creator>J Krause</dc:creator>
    <dc:creator>J Bryk</dc:creator>
    <dc:creator>P Khaitovich</dc:creator>
    <dc:creator>W Enard</dc:creator>
    <dc:creator>S Pääbo</dc:creator>
    <dc:identifier>doi:10.1186/gb-2005-6-7-r57</dc:identifier>
    <dc:source>Genome Biol, Vol. 6, No. 7. (2005)</dc:source>
    <dc:date>2006-07-24T16:58:32-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Genome Biol</prism:publicationName>
    <prism:issn>1465-6914</prism:issn>
    <prism:volume>6</prism:volume>
    <prism:number>7</prism:number>
    <prism:category>genetic_regulation</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/166875">
    <title>Multiple-laboratory comparison of microarray platforms</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/166875</link>
    <description>&lt;i&gt;Nature Methods, Vol. 2, No. 5. (21 April 2005), pp. 345-350.&lt;/i&gt;</description>
    <dc:title>Multiple-laboratory comparison of microarray platforms</dc:title>

    <dc:creator>Rafael Irizarry</dc:creator>
    <dc:creator>Daniel Warren</dc:creator>
    <dc:creator>Forrest Spencer</dc:creator>
    <dc:creator>Irene Kim</dc:creator>
    <dc:creator>Shyam Biswal</dc:creator>
    <dc:creator>Bryan Frank</dc:creator>
    <dc:creator>Edward Gabrielson</dc:creator>
    <dc:creator>Joe Garcia</dc:creator>
    <dc:creator>Joel Geoghegan</dc:creator>
    <dc:creator>Gregory Germino</dc:creator>
    <dc:creator>Constance Griffin</dc:creator>
    <dc:creator>Sara Hilmer</dc:creator>
    <dc:creator>Eric Hoffman</dc:creator>
    <dc:creator>Anne Jedlicka</dc:creator>
    <dc:creator>Ernest Kawasaki</dc:creator>
    <dc:creator>Francisco Martínez-Murillo</dc:creator>
    <dc:creator>Laura Morsberger</dc:creator>
    <dc:creator>Hannah Lee</dc:creator>
    <dc:creator>David Petersen</dc:creator>
    <dc:creator>John Quackenbush</dc:creator>
    <dc:creator>Alan Scott</dc:creator>
    <dc:creator>Michael Wilson</dc:creator>
    <dc:creator>Yanqin Yang</dc:creator>
    <dc:creator>Shui Ye</dc:creator>
    <dc:creator>Wayne Yu</dc:creator>
    <dc:identifier>doi:10.1038/nmeth756</dc:identifier>
    <dc:source>Nature Methods, Vol. 2, No. 5. (21 April 2005), pp. 345-350.</dc:source>
    <dc:date>2005-04-22T06:16:46-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Nature Methods</prism:publicationName>
    <prism:issn>1548-7091</prism:issn>
    <prism:volume>2</prism:volume>
    <prism:number>5</prism:number>
    <prism:startingPage>345</prism:startingPage>
    <prism:endingPage>350</prism:endingPage>
    <prism:publisher>Nature Publishing Group</prism:publisher>
    <prism:category>microarrays</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/684573">
    <title>Applied bioinformatics for the identification of regulatory elements.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/684573</link>
    <description>&lt;i&gt;Nat Rev Genet, Vol. 5, No. 4. (April 2004), pp. 276-287.&lt;/i&gt;</description>
    <dc:title>Applied bioinformatics for the identification of regulatory elements.</dc:title>

    <dc:creator>WW Wasserman</dc:creator>
    <dc:creator>A Sandelin</dc:creator>
    <dc:identifier>doi:10.1038/nrg1315</dc:identifier>
    <dc:source>Nat Rev Genet, Vol. 5, No. 4. (April 2004), pp. 276-287.</dc:source>
    <dc:date>2006-06-05T16:25:43-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:publicationName>Nat Rev Genet</prism:publicationName>
    <prism:issn>1471-0056</prism:issn>
    <prism:volume>5</prism:volume>
    <prism:number>4</prism:number>
    <prism:startingPage>276</prism:startingPage>
    <prism:endingPage>287</prism:endingPage>
    <prism:category>genetic_regulation</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/700992">
    <title>Transcriptome network component analysis with limited microarray data.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/700992</link>
    <description>&lt;i&gt;Bioinformatics (9 June 2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Network component analysis (NCA) is a method to deduce transcription factor (TF) activities and TF-gene regulation control strengths from gene expression data and a TF-gene binding connectivity network. Previously, this method could analyze a maximum number of regulators equal to the total sample size because of the identifiability limit in data decomposition. As such, the total number of source signal components was limited to the total number of experiments rather than the total number of biological regulators. However, networks that have less transcriptome data points than the number of regulators are of interest. Thus it is imperative to develop a theoretical basis that allows realistic source signal extraction based on relatively few data points. On the other hand, such methods would inherently increase numerical challenges leading to multiple solutions. Therefore, solutions to both problems are needed. RESULTS: We have improved NCA for transcription factor activity (TFA) estimation, based the observation that most genes are regulated by only a few TFs. This observation leads to the derivation of a new identifiability criterion which is tested during numerical iteration that allows us to decompose data when the number of TFs is greater than the number of experiments. To show that our method works with real microarray data and has biological utility, we analyze Saccharomyces cerevisiae cell cycle microarray data (73 experiments) using a TF-gene connectivity network (96 TFs) derived from ChIP-chip binding data. We compare the results of NCA analysis to results obtained from ChIP-chip regression methods, and we show that NCA and regression produce TFAs that are qualitatively similar, but the NCA TFAs outperform regression in statistical tests. We also show that NCA can extract subtle TFA signals that correlate with known cell cycle TF function and cell cycle phase. Overall we determined that 31 TFs have statistically periodic TFAs in one or more experiments, 75% of which are known cell cycle regulators. In addition we find that the 12 TFAs that are periodic in two or more experiments correspond to well known cell cycle regulators. We also investigated TFA sensitivity to the choice of connectivity network we constructed two networks using different ChIP-chip p-value cut-offs. AVAILABILITY: The NCA Toolbox for MATLAB is available at http://www.seas.ucla.edu/~liaoj/download.htm.</description>
    <dc:title>Transcriptome network component analysis with limited microarray data.</dc:title>

    <dc:creator>Simon J Galbraith</dc:creator>
    <dc:creator>Linh M Tran</dc:creator>
    <dc:creator>James C Liao</dc:creator>
    <dc:source>Bioinformatics (9 June 2006)</dc:source>
    <dc:date>2006-06-19T12:17:58-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Bioinformatics</prism:publicationName>
    <prism:issn>1367-4803</prism:issn>
    <prism:category>genetic_regulation</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/915261">
    <title>Stochastic model of transcription factor-regulated gene expression.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/915261</link>
    <description>&lt;i&gt;Phys Biol, Vol. 3, No. 3. (September 2006), pp. 200-208.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We consider a stochastic model of transcription factor (TF)-regulated gene expression. The model describes two genes, gene A and gene B, which synthesize the TFs and the target gene proteins, respectively. We show through analytic calculations that the TF fluctuations have a significant effect on the distribution of the target gene protein levels when the mean TF level falls in the highest sensitive region of the dose-response curve. We further study the effect of reducing the copy number of gene A from two to one. The enhanced TF fluctuations yield results different from those in the deterministic case. The probability that the target gene protein level exceeds a threshold value is calculated with the knowledge of the probability density functions associated with the TF and target gene protein levels. Numerical simulation results for a more detailed stochastic model are shown to be in agreement with those obtained through analytic calculations. The relevance of these results in the context of the genetic disorder haploinsufficiency is pointed out. Some experimental observations on the haploinsufficiency of the tumour suppressor gene, Nkx 3.1, are explained with the help of the stochastic model of TF-regulated gene expression.</description>
    <dc:title>Stochastic model of transcription factor-regulated gene expression.</dc:title>

    <dc:creator>R Karmakar</dc:creator>
    <dc:creator>I Bose</dc:creator>
    <dc:source>Phys Biol, Vol. 3, No. 3. (September 2006), pp. 200-208.</dc:source>
    <dc:date>2006-10-27T14:31:28-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Phys Biol</prism:publicationName>
    <prism:issn>1478-3967</prism:issn>
    <prism:volume>3</prism:volume>
    <prism:number>3</prism:number>
    <prism:startingPage>200</prism:startingPage>
    <prism:endingPage>208</prism:endingPage>
    <prism:category>genetic_regulation</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/1285080">
    <title>The genome of the kinetoplastid parasite, Leishmania major.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/1285080</link>
    <description>&lt;i&gt;Science, Vol. 309, No. 5733. (15 July 2005), pp. 436-442.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Leishmania species cause a spectrum of human diseases in tropical and subtropical regions of the world. We have sequenced the 36 chromosomes of the 32.8-megabase haploid genome of Leishmania major (Friedlin strain) and predict 911 RNA genes, 39 pseudogenes, and 8272 protein-coding genes, of which 36% can be ascribed a putative function. These include genes involved in host-pathogen interactions, such as proteolytic enzymes, and extensive machinery for synthesis of complex surface glycoconjugates. The organization of protein-coding genes into long, strand-specific, polycistronic clusters and lack of general transcription factors in the L. major, Trypanosoma brucei, and Trypanosoma cruzi (Tritryp) genomes suggest that the mechanisms regulating RNA polymerase II-directed transcription are distinct from those operating in other eukaryotes, although the trypanosomatids appear capable of chromatin remodeling. Abundant RNA-binding proteins are encoded in the Tritryp genomes, consistent with active posttranscriptional regulation of gene expression.</description>
    <dc:title>The genome of the kinetoplastid parasite, Leishmania major.</dc:title>

    <dc:creator>AC Ivens</dc:creator>
    <dc:creator>CS Peacock</dc:creator>
    <dc:creator>EA Worthey</dc:creator>
    <dc:creator>L Murphy</dc:creator>
    <dc:creator>G Aggarwal</dc:creator>
    <dc:creator>M Berriman</dc:creator>
    <dc:creator>E Sisk</dc:creator>
    <dc:creator>MA Rajandream</dc:creator>
    <dc:creator>E Adlem</dc:creator>
    <dc:creator>R Aert</dc:creator>
    <dc:creator>A Anupama</dc:creator>
    <dc:creator>Z Apostolou</dc:creator>
    <dc:creator>P Attipoe</dc:creator>
    <dc:creator>N Bason</dc:creator>
    <dc:creator>C Bauser</dc:creator>
    <dc:creator>A Beck</dc:creator>
    <dc:creator>SM Beverley</dc:creator>
    <dc:creator>G Bianchettin</dc:creator>
    <dc:creator>K Borzym</dc:creator>
    <dc:creator>G Bothe</dc:creator>
    <dc:creator>CV Bruschi</dc:creator>
    <dc:creator>M Collins</dc:creator>
    <dc:creator>E Cadag</dc:creator>
    <dc:creator>L Ciarloni</dc:creator>
    <dc:creator>C Clayton</dc:creator>
    <dc:creator>RM Coulson</dc:creator>
    <dc:creator>A Cronin</dc:creator>
    <dc:creator>AK Cruz</dc:creator>
    <dc:creator>RM Davies</dc:creator>
    <dc:creator>J De Gaudenzi</dc:creator>
    <dc:creator>DE Dobson</dc:creator>
    <dc:creator>A Duesterhoeft</dc:creator>
    <dc:creator>G Fazelina</dc:creator>
    <dc:creator>N Fosker</dc:creator>
    <dc:creator>AC Frasch</dc:creator>
    <dc:creator>A Fraser</dc:creator>
    <dc:creator>M Fuchs</dc:creator>
    <dc:creator>C Gabel</dc:creator>
    <dc:creator>A Goble</dc:creator>
    <dc:creator>A Goffeau</dc:creator>
    <dc:creator>D Harris</dc:creator>
    <dc:creator>C Hertz-Fowler</dc:creator>
    <dc:creator>H Hilbert</dc:creator>
    <dc:creator>D Horn</dc:creator>
    <dc:creator>Y Huang</dc:creator>
    <dc:creator>S Klages</dc:creator>
    <dc:creator>A Knights</dc:creator>
    <dc:creator>M Kube</dc:creator>
    <dc:creator>N Larke</dc:creator>
    <dc:creator>L Litvin</dc:creator>
    <dc:creator>A Lord</dc:creator>
    <dc:creator>T Louie</dc:creator>
    <dc:creator>M Marra</dc:creator>
    <dc:creator>D Masuy</dc:creator>
    <dc:creator>K Matthews</dc:creator>
    <dc:creator>S Michaeli</dc:creator>
    <dc:creator>JC Mottram</dc:creator>
    <dc:creator>S Müller-Auer</dc:creator>
    <dc:creator>H Munden</dc:creator>
    <dc:creator>S Nelson</dc:creator>
    <dc:creator>H Norbertczak</dc:creator>
    <dc:creator>K Oliver</dc:creator>
    <dc:creator>S O'neil</dc:creator>
    <dc:creator>M Pentony</dc:creator>
    <dc:creator>TM Pohl</dc:creator>
    <dc:creator>C Price</dc:creator>
    <dc:creator>B Purnelle</dc:creator>
    <dc:creator>MA Quail</dc:creator>
    <dc:creator>E Rabbinowitsch</dc:creator>
    <dc:creator>R Reinhardt</dc:creator>
    <dc:creator>M Rieger</dc:creator>
    <dc:creator>J Rinta</dc:creator>
    <dc:creator>J Robben</dc:creator>
    <dc:creator>L Robertson</dc:creator>
    <dc:creator>JC Ruiz</dc:creator>
    <dc:creator>S Rutter</dc:creator>
    <dc:creator>D Saunders</dc:creator>
    <dc:creator>M Schäfer</dc:creator>
    <dc:creator>J Schein</dc:creator>
    <dc:creator>DC Schwartz</dc:creator>
    <dc:creator>K Seeger</dc:creator>
    <dc:creator>A Seyler</dc:creator>
    <dc:creator>S Sharp</dc:creator>
    <dc:creator>H Shin</dc:creator>
    <dc:creator>D Sivam</dc:creator>
    <dc:creator>R Squares</dc:creator>
    <dc:creator>S Squares</dc:creator>
    <dc:creator>V Tosato</dc:creator>
    <dc:creator>C Vogt</dc:creator>
    <dc:creator>G Volckaert</dc:creator>
    <dc:creator>R Wambutt</dc:creator>
    <dc:creator>T Warren</dc:creator>
    <dc:creator>H Wedler</dc:creator>
    <dc:creator>J Woodward</dc:creator>
    <dc:creator>S Zhou</dc:creator>
    <dc:creator>W Zimmermann</dc:creator>
    <dc:creator>DF Smith</dc:creator>
    <dc:creator>JM Blackwell</dc:creator>
    <dc:creator>KD Stuart</dc:creator>
    <dc:creator>B Barrell</dc:creator>
    <dc:creator>PJ Myler</dc:creator>
    <dc:identifier>doi:10.1126/science.1112680</dc:identifier>
    <dc:source>Science, Vol. 309, No. 5733. (15 July 2005), pp. 436-442.</dc:source>
    <dc:date>2007-05-09T11:29:53-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Science</prism:publicationName>
    <prism:issn>1095-9203</prism:issn>
    <prism:volume>309</prism:volume>
    <prism:number>5733</prism:number>
    <prism:startingPage>436</prism:startingPage>
    <prism:endingPage>442</prism:endingPage>
    <prism:category>leishmaniasis</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/1116998">
    <title>How to infer gene networks from expression profiles</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/1116998</link>
    <description>&lt;i&gt;Mol Syst Biol, Vol. 3 (13 February 2007)&lt;/i&gt;</description>
    <dc:title>How to infer gene networks from expression profiles</dc:title>

    <dc:creator>Mukesh Bansal</dc:creator>
    <dc:creator>Vincenzo Belcastro</dc:creator>
    <dc:creator>Alberto Ambesi-Impiombato</dc:creator>
    <dc:creator>Diego di Bernardo</dc:creator>
    <dc:identifier>doi:10.1038/msb4100120</dc:identifier>
    <dc:source>Mol Syst Biol, Vol. 3 (13 February 2007)</dc:source>
    <dc:date>2007-02-21T21:52:28-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:publicationName>Mol Syst Biol</prism:publicationName>
    <prism:volume>3</prism:volume>
    <prism:category>genetic_regulation</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/437270">
    <title>Genetic regulation of root hair development in Arabidopsis thaliana: a network model.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/437270</link>
    <description>&lt;i&gt;J Theor Biol, Vol. 204, No. 3. (7 June 2000), pp. 311-326.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;The root epidermis of Arabidopsis thaliana is formed by alternate files of hair and non-hair cells. Epidermal cells overlying two cortex cells eventually develop a hair, while those overlying only one cortex cell do not. Here we propose a network model that integrates most of the available genetic and molecular data on the regulatory and signaling pathways underlying root epidermal differentiation. The network architecture includes two pathways; one formed by the genes TTG, R homolog, GL2 and CPC, and the other one by the signal transduction proteins ETR1 and CTR1. Both parallel pathways regulate the activity of AXR2 and RHD6, which in turn control the development of root hairs. The regulatory network was simulated as a dynamical system of eight discrete state variables. The distinction between epidermal cells contacting one or two cortical cells was accounted for by fixing the initial states of CPC and ETR1 proteins. The model allows for predictions of mutants and pharmacological effects because it includes the ethylene receptor. The dynamical system reaches one of the six stable states depending upon the initial state of the CPC variable and the ethylene receptor. Two of the stable states describe the activation patterns observed in mature trichoblasts (hair cells) and atrichoblasts (non-hair cells) in the wild-type phenotype and under normal ethylene availability. The other four states correspond to changes in the number of hair cells due to experimentally induced changes in ethylene availability. This model provides a hypothesis on the interactions among genes that encode transcription factors that regulate root hair development and the proteins involved in the ethylene transduction pathway. This is the first effort to use a dynamical system to understand the complex genetic regulatory interactions that rule Arabidopsis primary root development. The advantages of this type of models over static schematic representations are discussed.</description>
    <dc:title>Genetic regulation of root hair development in Arabidopsis thaliana: a network model.</dc:title>

    <dc:creator>L Mendoza</dc:creator>
    <dc:creator>ER Alvarez-Buylla</dc:creator>
    <dc:identifier>doi:10.1006/jtbi.2000.2014</dc:identifier>
    <dc:source>J Theor Biol, Vol. 204, No. 3. (7 June 2000), pp. 311-326.</dc:source>
    <dc:date>2005-12-14T09:05:45-00:00</dc:date>
    <prism:publicationYear>2000</prism:publicationYear>
    <prism:publicationName>J Theor Biol</prism:publicationName>
    <prism:issn>0022-5193</prism:issn>
    <prism:volume>204</prism:volume>
    <prism:number>3</prism:number>
    <prism:startingPage>311</prism:startingPage>
    <prism:endingPage>326</prism:endingPage>
    <prism:category>genetic_regulation</prism:category>
    <prism:category>plants</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/238188">
    <title>Gapped BLAST and PSI-BLAST: a new generation of protein database search programs.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/238188</link>
    <description>&lt;i&gt;Nucleic Acids Res, Vol. 25, No. 17. (1 September 1997), pp. 3389-3402.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;The BLAST programs are widely used tools for searching protein and DNA databases for sequence similarities. For protein comparisons, a variety of definitional, algorithmic and statistical refinements described here permits the execution time of the BLAST programs to be decreased substantially while enhancing their sensitivity to weak similarities. A new criterion for triggering the extension of word hits, combined with a new heuristic for generating gapped alignments, yields a gapped BLAST program that runs at approximately three times the speed of the original. In addition, a method is introduced for automatically combining statistically significant alignments produced by BLAST into a position-specific score matrix, and searching the database using this matrix. The resulting Position-Specific Iterated BLAST (PSI-BLAST) program runs at approximately the same speed per iteration as gapped BLAST, but in many cases is much more sensitive to weak but biologically relevant sequence similarities. PSI-BLAST is used to uncover several new and interesting members of the BRCT superfamily.</description>
    <dc:title>Gapped BLAST and PSI-BLAST: a new generation of protein database search programs.</dc:title>

    <dc:creator>SF Altschul</dc:creator>
    <dc:creator>TL Madden</dc:creator>
    <dc:creator>AA Schäffer</dc:creator>
    <dc:creator>J Zhang</dc:creator>
    <dc:creator>Z Zhang</dc:creator>
    <dc:creator>W Miller</dc:creator>
    <dc:creator>DJ Lipman</dc:creator>
    <dc:identifier>doi:10.1093/nar/25.17.3389</dc:identifier>
    <dc:source>Nucleic Acids Res, Vol. 25, No. 17. (1 September 1997), pp. 3389-3402.</dc:source>
    <dc:date>2005-06-26T00:48:58-00:00</dc:date>
    <prism:publicationYear>1997</prism:publicationYear>
    <prism:publicationName>Nucleic Acids Res</prism:publicationName>
    <prism:issn>0305-1048</prism:issn>
    <prism:volume>25</prism:volume>
    <prism:number>17</prism:number>
    <prism:startingPage>3389</prism:startingPage>
    <prism:endingPage>3402</prism:endingPage>
    <prism:category>blast</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2369506">
    <title>Bioinformatics challenges of new sequencing technology</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2369506</link>
    <description>&lt;i&gt;Trends in Genetics, Vol. In Press, Corrected Proof&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;New DNA sequencing technologies can sequence up to one billion bases in a single day at low cost, putting large-scale sequencing within the reach of many scientists. Many researchers are forging ahead with projects to sequence a range of species using the new technologies. However, these new technologies produce read lengths as short as 35-40 nucleotides, posing challenges for genome assembly and annotation. Here we review the challenges and describe some of the bioinformatics systems that are being proposed to solve them. We specifically address issues arising from using these technologies in assembly projects, both de novo and for resequencing purposes, as well as efforts to improve genome annotation in the fragmented assemblies produced by short read lengths.</description>
    <dc:title>Bioinformatics challenges of new sequencing technology</dc:title>

    <dc:creator>Mihai Pop</dc:creator>
    <dc:creator>Steven Salzberg</dc:creator>
    <dc:identifier>doi:10.1016/j.tig.2007.12.006</dc:identifier>
    <dc:source>Trends in Genetics, Vol. In Press, Corrected Proof</dc:source>
    <dc:date>2008-02-13T12:33:43-00:00</dc:date>
    <prism:publicationName>Trends in Genetics</prism:publicationName>
    <prism:volume>In Press, Corrected Proof</prism:volume>
    <prism:category>dna_sequencing</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2629481">
    <title>CAMERA: A Community Resource for Metagenomics</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2629481</link>
    <description>&lt;i&gt;PLoS Biology, Vol. 5, No. 3. (1 March 2007), e75.&lt;/i&gt;</description>
    <dc:title>CAMERA: A Community Resource for Metagenomics</dc:title>

    <dc:creator>Rekha Seshadri</dc:creator>
    <dc:creator>Saul Kravitz</dc:creator>
    <dc:creator>Larry Smarr</dc:creator>
    <dc:creator>Paul Gilna</dc:creator>
    <dc:creator>Marvin Frazier</dc:creator>
    <dc:identifier>doi:10.1371%2Fjournal.pbio.0050075</dc:identifier>
    <dc:source>PLoS Biology, Vol. 5, No. 3. (1 March 2007), e75.</dc:source>
    <dc:date>2008-04-04T11:55:30-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:publicationName>PLoS Biology</prism:publicationName>
    <prism:volume>5</prism:volume>
    <prism:number>3</prism:number>
    <prism:startingPage>e75</prism:startingPage>
    <prism:category>genomics_analysis</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/1145123">
    <title>Comparative genome assembly.</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/1145123</link>
    <description>&lt;i&gt;Brief Bioinform, Vol. 5, No. 3. (September 2004), pp. 237-248.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;One of the most complex and computationally intensive tasks of genome sequence analysis is genome assembly. Even today, few centres have the resources, in both software and hardware, to assemble a genome from the thousands or millions of individual sequences generated in a whole-genome shotgun sequencing project. With the rapid growth in the number of sequenced genomes has come an increase in the number of organisms for which two or more closely related species have been sequenced. This has created the possibility of building a comparative genome assembly algorithm, which can assemble a newly sequenced genome by mapping it onto a reference genome. We describe here a novel algorithm for comparative genome assembly that can accurately assemble a typical bacterial genome in less than four minutes on a standard desktop computer. The software is available as part of the open-source AMOS project.</description>
    <dc:title>Comparative genome assembly.</dc:title>

    <dc:creator>M Pop</dc:creator>
    <dc:creator>A Phillippy</dc:creator>
    <dc:creator>AL Delcher</dc:creator>
    <dc:creator>SL Salzberg</dc:creator>
    <dc:identifier>doi:10.1093/bib/5.3.237</dc:identifier>
    <dc:source>Brief Bioinform, Vol. 5, No. 3. (September 2004), pp. 237-248.</dc:source>
    <dc:date>2007-03-07T04:40:34-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:publicationName>Brief Bioinform</prism:publicationName>
    <prism:issn>1467-5463</prism:issn>
    <prism:volume>5</prism:volume>
    <prism:number>3</prism:number>
    <prism:startingPage>237</prism:startingPage>
    <prism:endingPage>248</prism:endingPage>
    <prism:category>genomics_analysis</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/mariakmejia/article/2311222">
    <title>Pyrobayes: an improved base caller for SNP discovery in pyrosequences</title>
    <link>http://www.citeulike.org/user/mariakmejia/article/2311222</link>
    <description>&lt;i&gt;Nature Methods, Vol. 5, No. 2. (13 January 2008), pp. 179-181.&lt;/i&gt;</description>
    <dc:title>Pyrobayes: an improved base caller for SNP discovery in pyrosequences</dc:title>

    <dc:creator>Aaron Quinlan</dc:creator>
    <dc:creator>Donald Stewart</dc:creator>
    <dc:creator>Michael Strömberg</dc:creator>
    <dc:creator>Gábor Marth</dc:creator>
    <dc:identifier>doi:10.1038/nmeth.1172</dc:identifier>
    <dc:source>Nature Methods, Vol. 5, No. 2. (13 January 2008), pp. 179-181.</dc:source>
    <dc:date>2008-01-31T11:58:19-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Nature Methods</prism:publicationName>
    <prism:issn>1548-7091</prism:issn>
    <prism:volume>5</prism:volume>
    <prism:number>2</prism:number>
    <prism:startingPage>179</prism:startingPage>
    <prism:endingPage>181</prism:endingPage>
    <prism:publisher>Nature Publishing Group</prism:publisher>
    <prism:category>dna_sequencing</prism:category>
</item>



</rdf:RDF>

