<?xml version="1.0" encoding="UTF-8"?>

<rdf:RDF
   xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
   xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#"
   xmlns="http://purl.org/rss/1.0/"
   xmlns:dc="http://purl.org/dc/elements/1.1/"
   xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/"
   xmlns:dcterms="http://purl.org/dc/terms/"

>
<channel rdf:about="http://www.citeulike.org/about">
<pubDate>Sun, 06 Jul 2008 02:04:44 BST</pubDate>


	<title>CiteULike: vlachmore's library [290 articles]</title>
	<description>CiteULike: vlachmore's library [290 articles]</description>


	<link>http://www.citeulike.org/user/vlachmore</link>
	<dc:publisher>CiteULike.org</dc:publisher>
	<dc:language>en-gb</dc:language>
	<dc:rights>Copyright &#169; 2004-2008 citeulike.org</dc:rights>
	<items>
    <rdf:Seq>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2948859"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/519793"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/531257"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2910900"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2903283"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/531251"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2891300"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2875286"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2861694"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2861514"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2587956"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/510438"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2133755"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2861462"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2805713"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/1915444"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2801724"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2587574"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2776008"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2670160"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2775855"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2765621"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2697015"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/1185721"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2674017"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2672890"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2658576"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/819622"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2637717"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/113955"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/1153421"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/1304139"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/590638"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2520315"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2515403"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2515369"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2504970"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/1081834"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2491840"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2491574"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2491502"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2491441"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2354608"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/1983303"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/635668"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2465524"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2449590"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2447750"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2447739"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/vlachmore/article/2394375"/>

	</rdf:Seq>
	</items>
	</channel>


<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2948859">
    <title>Diffusion Kernels on Statistical Manifolds</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2948859</link>
    <description>&lt;i&gt;J. Mach. Learn. Res., Vol. 6 (2005), pp. 129-163.&lt;/i&gt;</description>
    <dc:title>Diffusion Kernels on Statistical Manifolds</dc:title>

    <dc:creator>John Lafferty</dc:creator>
    <dc:creator>Guy Lebanon</dc:creator>
    <dc:source>J. Mach. Learn. Res., Vol. 6 (2005), pp. 129-163.</dc:source>
    <dc:date>2008-07-01T16:53:25-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>J. Mach. Learn. Res.</prism:publicationName>
    <prism:issn>1533-7928</prism:issn>
    <prism:volume>6</prism:volume>
    <prism:startingPage>129</prism:startingPage>
    <prism:endingPage>163</prism:endingPage>
    <prism:publisher>MIT Press</prism:publisher>
    <prism:category>heat</prism:category>
    <prism:category>kernel</prism:category>
    <prism:category>machines</prism:category>
    <prism:category>support</prism:category>
    <prism:category>svms</prism:category>
    <prism:category>vector</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/519793">
    <title>A variational Bayesian framework for graphical models</title>
    <link>http://www.citeulike.org/user/vlachmore/article/519793</link>
    <description>&lt;i&gt;(2000)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;This paper presents a novel practical framework for Bayesian model averaging and model selection in probabilistic graphical models. Our approach approximates full posterior distributions over model parameters and structures, as well as latent variables, in an analytical manner. These posteriors fall out of a free-form optimization procedure, which naturally incorporates conjugate priors. Unlike in large sample approximations, the posteriors are generally nonGaussian and no Hessian needs...</description>
    <dc:title>A variational Bayesian framework for graphical models</dc:title>

    <dc:creator>H Attias</dc:creator>
    <dc:source>(2000)</dc:source>
    <dc:date>2006-02-24T14:33:47-00:00</dc:date>
    <prism:publicationYear>2000</prism:publicationYear>
    <prism:category>bayesian</prism:category>
    <prism:category>graphical</prism:category>
    <prism:category>models</prism:category>
    <prism:category>variational_inference</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/531257">
    <title>Document clustering based on non-negative matrix factorization</title>
    <link>http://www.citeulike.org/user/vlachmore/article/531257</link>
    <description>&lt;i&gt;(2003), pp. 267-273.&lt;/i&gt;</description>
    <dc:title>Document clustering based on non-negative matrix factorization</dc:title>

    <dc:creator>Wei Xu</dc:creator>
    <dc:creator>Xin Liu</dc:creator>
    <dc:creator>Yihong Gong</dc:creator>
    <dc:identifier>doi:10.1145/860435.860485</dc:identifier>
    <dc:source>(2003), pp. 267-273.</dc:source>
    <dc:date>2006-03-06T08:47:16-00:00</dc:date>
    <prism:publicationYear>2003</prism:publicationYear>
    <prism:startingPage>267</prism:startingPage>
    <prism:endingPage>273</prism:endingPage>
    <prism:publisher>ACM Press</prism:publisher>
    <prism:category>clustering</prism:category>
    <prism:category>document</prism:category>
    <prism:category>factorization</prism:category>
    <prism:category>matrix</prism:category>
    <prism:category>non-negative</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2910900">
    <title>Technical Introduction: A Primer on Probabilistic Inference</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2910900</link>
    <description>&lt;i&gt;(2006)&lt;/i&gt;</description>
    <dc:title>Technical Introduction: A Primer on Probabilistic Inference</dc:title>

    <dc:creator>Thomas Griffiths</dc:creator>
    <dc:creator>Alan Yuille</dc:creator>
    <dc:source>(2006)</dc:source>
    <dc:date>2008-06-20T15:59:07-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:category>inference</prism:category>
    <prism:category>probabilistic</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2903283">
    <title>Projected Gradient Methods for Nonnegative Matrix Factorization</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2903283</link>
    <description>&lt;i&gt;Neural Comp., Vol. 19, No. 10. (1 October 2007), pp. 2756-2779.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Nonnegative matrix factorization (NMF) can be formulated as a minimization problem with bound constraints. Although bound-constrained optimization has been studied extensively in both theory and practice, so far no study has formally applied its techniques to NMF. In this letter, we propose two projected gradient methods for NMF, both of which exhibit strong optimization properties. We discuss efficient implementations and demonstrate that one of the proposed methods converges faster than the popular multiplicative update approach. A simple Matlab code is also provided.</description>
    <dc:title>Projected Gradient Methods for Nonnegative Matrix Factorization</dc:title>

    <dc:creator>Chih-Jen Lin</dc:creator>
    <dc:source>Neural Comp., Vol. 19, No. 10. (1 October 2007), pp. 2756-2779.</dc:source>
    <dc:date>2008-06-17T23:21:40-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:publicationName>Neural Comp.</prism:publicationName>
    <prism:volume>19</prism:volume>
    <prism:number>10</prism:number>
    <prism:startingPage>2756</prism:startingPage>
    <prism:endingPage>2779</prism:endingPage>
    <prism:category>factorization</prism:category>
    <prism:category>matrix</prism:category>
    <prism:category>non-negative</prism:category>
    <prism:category>software</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/531251">
    <title>Algorithms for Non-negative Matrix Factorization</title>
    <link>http://www.citeulike.org/user/vlachmore/article/531251</link>
    <description>&lt;i&gt;(2000), pp. 556-562.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Non-negative matrix factorization (NMF) has previously been shown to be a useful decomposition for multivariate data. Two different multiplicative algorithms for NMF are analyzed. They differ only slightly in the multiplicative factor used in the update rules. One algorithm can be shown to minimize the conventional least squares error while the other minimizes the generalized Kullback-Leibler divergence. The monotonic convergence of both algorithms can be proven using an auxiliary...</description>
    <dc:title>Algorithms for Non-negative Matrix Factorization</dc:title>

    <dc:creator>Daniel Lee</dc:creator>
    <dc:creator>Sebastian Seung</dc:creator>
    <dc:source>(2000), pp. 556-562.</dc:source>
    <dc:date>2006-03-06T06:55:34-00:00</dc:date>
    <prism:publicationYear>2000</prism:publicationYear>
    <prism:startingPage>556</prism:startingPage>
    <prism:endingPage>562</prism:endingPage>
    <prism:category>dimensionality</prism:category>
    <prism:category>factorization</prism:category>
    <prism:category>matrix</prism:category>
    <prism:category>non-negative</prism:category>
    <prism:category>reduction</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2891300">
    <title>A generalization of principal component analysis to the exponential family</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2891300</link>
    <description>&lt;i&gt;(2001)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Principal component analysis (PCA) is a commonly applied technique for dimensionality reduction. PCA implicitly minimizes a squared loss function, which may be inappropriate for data that is not real-valued, such as binary-valued data. This paper draws on ideas from the Exponential family, Generalized linear models, and Bregman distances, to give a generalization of PCA to loss functions that we argue are better suited to other data types. We describe algorithms for minimizing the loss...</description>
    <dc:title>A generalization of principal component analysis to the exponential family</dc:title>

    <dc:creator>M Collins</dc:creator>
    <dc:creator>S Dasgupta</dc:creator>
    <dc:creator>R Schapire</dc:creator>
    <dc:source>(2001)</dc:source>
    <dc:date>2008-06-13T12:58:17-00:00</dc:date>
    <prism:publicationYear>2001</prism:publicationYear>
    <prism:category>analysis</prism:category>
    <prism:category>component</prism:category>
    <prism:category>dimensionality</prism:category>
    <prism:category>exponential</prism:category>
    <prism:category>pca</prism:category>
    <prism:category>principal</prism:category>
    <prism:category>reduction</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2875286">
    <title>A Bayesian Model for Supervised Clustering with the Dirichlet Process Prior</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2875286</link>
    <description>&lt;i&gt;J. Mach. Learn. Res., Vol. 6 (2005), pp. 1551-1577.&lt;/i&gt;</description>
    <dc:title>A Bayesian Model for Supervised Clustering with the Dirichlet Process Prior</dc:title>

    <dc:creator>Hal Iii</dc:creator>
    <dc:creator>Daniel Marcu</dc:creator>
    <dc:source>J. Mach. Learn. Res., Vol. 6 (2005), pp. 1551-1577.</dc:source>
    <dc:date>2008-06-09T10:49:34-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>J. Mach. Learn. Res.</prism:publicationName>
    <prism:issn>1533-7928</prism:issn>
    <prism:volume>6</prism:volume>
    <prism:startingPage>1551</prism:startingPage>
    <prism:endingPage>1577</prism:endingPage>
    <prism:publisher>MIT Press</prism:publisher>
    <prism:category>bayesian</prism:category>
    <prism:category>clustering</prism:category>
    <prism:category>dirichlet</prism:category>
    <prism:category>non-parametric</prism:category>
    <prism:category>prior</prism:category>
    <prism:category>process</prism:category>
    <prism:category>supervised</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2861694">
    <title>Sufficient Dimensionality Reduction</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2861694</link>
    <description>&lt;i&gt;&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Dimensionality reduction of empirical co-occurrence data is a fundamental problem in unsupervised learning. It is also a well studied problem in statistics known as the analysis of cross-classified data. One principled approach to this problem is to represent the data in low dimension with minimal loss of (mutual) information contained in the original data. In this paper we introduce an information theoretic nonlinear method for finding such a most informative dimension reduction.</description>
    <dc:title>Sufficient Dimensionality Reduction</dc:title>

    <dc:creator>Amir Globerson</dc:creator>
    <dc:creator>Naftali Tishby</dc:creator>
    <dc:date>2008-06-04T15:57:24-00:00</dc:date>
    <prism:category>dimensionality</prism:category>
    <prism:category>reduction</prism:category>
    <prism:category>selection</prism:category>
    <prism:category>unsupervised</prism:category>
    <prism:category>variable</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2861514">
    <title>Detecting Stable Clusters Using Principal Component Analysis</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2861514</link>
    <description>&lt;i&gt;Functional Genomics (2003), pp. 159-182.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Clustering is one of the most commonly used tools in the analysis of gene expression data (1,2). The usage in grouping genes is based on the premise that coexpression is a result of coregulation. It is often used as a preliminary step in extracting gene networks and inference of gene function (3,4). Clustering of experiments can be used to discover novel phenotypic aspects of cells and tissues (3,5,6), including sensitivity to drugs (7), and can also detect artifacts of experimental conditions (8). Clustering and its applications in biology are presented in greater detail in Chapter 13 (see also ref. 9). While we focus on gene expression data in this chapter, the methodology presented here is applicable for other types of data as well.</description>
    <dc:title>Detecting Stable Clusters Using Principal Component Analysis</dc:title>

    <dc:creator>Asa Ben-Hur</dc:creator>
    <dc:creator>Isabelle Guyon</dc:creator>
    <dc:identifier>doi:10.1385/1-59259-364-X:159</dc:identifier>
    <dc:source>Functional Genomics (2003), pp. 159-182.</dc:source>
    <dc:date>2008-06-04T15:42:53-00:00</dc:date>
    <prism:publicationYear>2003</prism:publicationYear>
    <prism:publicationName>Functional Genomics</prism:publicationName>
    <prism:startingPage>159</prism:startingPage>
    <prism:endingPage>182</prism:endingPage>
    <prism:category>analysis</prism:category>
    <prism:category>clustering</prism:category>
    <prism:category>component</prism:category>
    <prism:category>dimensionality</prism:category>
    <prism:category>pca</prism:category>
    <prism:category>principal</prism:category>
    <prism:category>reduction</prism:category>
    <prism:category>selection</prism:category>
    <prism:category>unsupervised</prism:category>
    <prism:category>variable</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2587956">
    <title>Unsupervised Feature Selection Using Feature Similarity</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2587956</link>
    <description>&lt;i&gt;IEEE Transactions on Pattern Analysis and Machine Intelligence, Vol. 24, No. 4. (2002)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;In this article, we describe an unsupervised feature selection algorithm suitable for data sets, large in both dimension and size. The method is based on measuring similarity between features whereby redundancy therein is removed. This does not need any search and, therefore, is fast. A feature similarity measure, called maximum information compression index, is introduced. The algorithm is generic in nature and has the capability of multiscale representation of data sets. The superiority of...</description>
    <dc:title>Unsupervised Feature Selection Using Feature Similarity</dc:title>

    <dc:creator>P Mitra</dc:creator>
    <dc:creator>CA Murthy</dc:creator>
    <dc:creator>SK Pal</dc:creator>
    <dc:source>IEEE Transactions on Pattern Analysis and Machine Intelligence, Vol. 24, No. 4. (2002)</dc:source>
    <dc:date>2008-03-26T00:13:20-00:00</dc:date>
    <prism:publicationYear>2002</prism:publicationYear>
    <prism:publicationName>IEEE Transactions on Pattern Analysis and Machine Intelligence</prism:publicationName>
    <prism:volume>24</prism:volume>
    <prism:number>4</prism:number>
    <prism:category>dimensionality</prism:category>
    <prism:category>reduction</prism:category>
    <prism:category>selection</prism:category>
    <prism:category>unsupervised</prism:category>
    <prism:category>variable</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/510438">
    <title>Variable Selection for Model-Based Clustering</title>
    <link>http://www.citeulike.org/user/vlachmore/article/510438</link>
    <description>&lt;i&gt;Journal of the American Statistical Association, Vol. 101, No. 473. (March 2006), pp. 168-178.&lt;/i&gt;</description>
    <dc:title>Variable Selection for Model-Based Clustering</dc:title>

    <dc:creator>Adrian Raftery</dc:creator>
    <dc:creator>Nema Dean</dc:creator>
    <dc:identifier>doi:10.1198/016214506000000113</dc:identifier>
    <dc:source>Journal of the American Statistical Association, Vol. 101, No. 473. (March 2006), pp. 168-178.</dc:source>
    <dc:date>2006-02-18T14:36:37-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Journal of the American Statistical Association</prism:publicationName>
    <prism:issn>0162-1459</prism:issn>
    <prism:volume>101</prism:volume>
    <prism:number>473</prism:number>
    <prism:startingPage>168</prism:startingPage>
    <prism:endingPage>178</prism:endingPage>
    <prism:publisher>American Statistical Association</prism:publisher>
    <prism:category>clustering</prism:category>
    <prism:category>dimensionality</prism:category>
    <prism:category>reduction</prism:category>
    <prism:category>selection</prism:category>
    <prism:category>unsupervised</prism:category>
    <prism:category>variable</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2133755">
    <title>Unsupervised Forward Selection: A Method for Eliminating Redundant Variables</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2133755</link>
    <description>&lt;i&gt;J. Chem. Inf. Comput. Sci., Vol. 40, No. 5. (25 September 2000), pp. 1160-1168.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Abstract: An unsupervised learning method is proposed for variable selection and its performance assessed using three typical QSAR data sets. The aims of this procedure are to generate a subset of descriptors from any given data set in which the resultant variables are relevant, redundancy is eliminated, and multicollinearity is reduced. Continuum regression, an algorithm encompassing ordinary least squares regression, regression on principal components, and partial least squares regression, was used to construct models from the selected variables. The variable selection routine is shown to produce simple, robust, and easily interpreted models for the chosen data sets.</description>
    <dc:title>Unsupervised Forward Selection: A Method for Eliminating Redundant Variables</dc:title>

    <dc:creator>DC Whitley</dc:creator>
    <dc:creator>MG Ford</dc:creator>
    <dc:creator>DJ Livingstone</dc:creator>
    <dc:identifier>doi:10.1021/ci000384c</dc:identifier>
    <dc:source>J. Chem. Inf. Comput. Sci., Vol. 40, No. 5. (25 September 2000), pp. 1160-1168.</dc:source>
    <dc:date>2007-12-16T21:40:56-00:00</dc:date>
    <prism:publicationYear>2000</prism:publicationYear>
    <prism:publicationName>J. Chem. Inf. Comput. Sci.</prism:publicationName>
    <prism:volume>40</prism:volume>
    <prism:number>5</prism:number>
    <prism:startingPage>1160</prism:startingPage>
    <prism:endingPage>1168</prism:endingPage>
    <prism:category>clustering</prism:category>
    <prism:category>dimensionality</prism:category>
    <prism:category>reduction</prism:category>
    <prism:category>selection</prism:category>
    <prism:category>unsupervised</prism:category>
    <prism:category>variable</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2861462">
    <title>CLIFF: Clustering of High-Dimensional Microarray Data via Iterative Feature Filtering Using Normalized Cuts</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2861462</link>
    <description>&lt;i&gt;(2001)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We present CLIFF, an algorithm for clustering biological samples using gene expression microarray data. This clustering problem is difficult for several reasons, in particular the sparsity of the data, the high dimensionality of the feature (gene) space, and the fact that many features are irrelevant or redundant. Our algorithm iterates between two computational processes, feature filtering and clustering. Given a reference partition that approximates the correct clustering of the samples, our...</description>
    <dc:title>CLIFF: Clustering of High-Dimensional Microarray Data via Iterative Feature Filtering Using Normalized Cuts</dc:title>

    <dc:creator>Eric Xing</dc:creator>
    <dc:creator>Richard Karp</dc:creator>
    <dc:source>(2001)</dc:source>
    <dc:date>2008-06-04T15:22:31-00:00</dc:date>
    <prism:publicationYear>2001</prism:publicationYear>
    <prism:category>clustering</prism:category>
    <prism:category>dimensionality</prism:category>
    <prism:category>reduction</prism:category>
    <prism:category>selection</prism:category>
    <prism:category>unsupervised</prism:category>
    <prism:category>variable</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2805713">
    <title>Church: a language for generative models</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2805713</link>
    <description>&lt;i&gt;(2008)&lt;/i&gt;</description>
    <dc:title>Church: a language for generative models</dc:title>

    <dc:creator>Noah Goodman</dc:creator>
    <dc:creator>Vikash Mansinghka</dc:creator>
    <dc:creator>Daniel Roy</dc:creator>
    <dc:creator>Keith Bonawitz</dc:creator>
    <dc:creator>Joshua Tenenbaum</dc:creator>
    <dc:source>(2008)</dc:source>
    <dc:date>2008-05-16T18:44:37-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:category>church</prism:category>
    <prism:category>generative</prism:category>
    <prism:category>models</prism:category>
    <prism:category>non-parametric</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/1915444">
    <title>Incorporating non-local information into information extraction systems by Gibbs sampling</title>
    <link>http://www.citeulike.org/user/vlachmore/article/1915444</link>
    <description>&lt;i&gt;(2005), pp. 363-370.&lt;/i&gt;</description>
    <dc:title>Incorporating non-local information into information extraction systems by Gibbs sampling</dc:title>

    <dc:creator>Jenny Finkel</dc:creator>
    <dc:creator>Trond Grenager</dc:creator>
    <dc:creator>Christopher Manning</dc:creator>
    <dc:identifier>doi:10.3115/1219840.1219885</dc:identifier>
    <dc:source>(2005), pp. 363-370.</dc:source>
    <dc:date>2007-11-14T19:16:28-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:startingPage>363</prism:startingPage>
    <prism:endingPage>370</prism:endingPage>
    <prism:publisher>Association for Computational Linguistics</prism:publisher>
    <prism:category>conditional</prism:category>
    <prism:category>crf</prism:category>
    <prism:category>fields</prism:category>
    <prism:category>ner</prism:category>
    <prism:category>random</prism:category>
    <prism:category>skip-chain</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2801724">
    <title>An Introduction to Variable and Feature Selection</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2801724</link>
    <description>&lt;i&gt;Journal of Machine Learning Research, Vol. 3 (March 2003), pp. 1157-1182.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Variable and feature selection have become the focus of much research in areas of application for which datasets with tens or hundreds of thousands of variables are available. These areas include text processing of internet documents, gene expression array analysis, and combinatorial chemistry. The objective of variable selection is three-fold: improving the prediction performance of the predictors, providing faster and more cost-effective predictors, and providing a better understanding of the underlying process that generated the data. The contributions of this special issue cover a wide range of aspects of such problems: providing a better definition of the objective function, feature construction, feature ranking, multivariate feature selection, efficient search methods, and feature validity assessment methods.</description>
    <dc:title>An Introduction to Variable and Feature Selection</dc:title>

    <dc:creator>Isabelle Guyon</dc:creator>
    <dc:creator>André Elisseeff</dc:creator>
    <dc:source>Journal of Machine Learning Research, Vol. 3 (March 2003), pp. 1157-1182.</dc:source>
    <dc:date>2008-05-15T14:24:39-00:00</dc:date>
    <prism:publicationYear>2003</prism:publicationYear>
    <prism:publicationName>Journal of Machine Learning Research</prism:publicationName>
    <prism:volume>3</prism:volume>
    <prism:startingPage>1157</prism:startingPage>
    <prism:endingPage>1182</prism:endingPage>
    <prism:category>dimensionality</prism:category>
    <prism:category>feature</prism:category>
    <prism:category>reduction</prism:category>
    <prism:category>selection</prism:category>
    <prism:category>variable</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2587574">
    <title>A Tutorial on Conformal Prediction</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2587574</link>
    <description>&lt;i&gt;Journal of Machine Learning Research, Vol. 9 (March 2008), pp. 371-421.&lt;/i&gt;</description>
    <dc:title>A Tutorial on Conformal Prediction</dc:title>

    <dc:creator>Glenn Shafer</dc:creator>
    <dc:creator>Vladimir Vovk</dc:creator>
    <dc:source>Journal of Machine Learning Research, Vol. 9 (March 2008), pp. 371-421.</dc:source>
    <dc:date>2008-03-25T20:09:52-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Journal of Machine Learning Research</prism:publicationName>
    <prism:volume>9</prism:volume>
    <prism:startingPage>371</prism:startingPage>
    <prism:endingPage>421</prism:endingPage>
    <prism:category>conformal</prism:category>
    <prism:category>learning</prism:category>
    <prism:category>machine</prism:category>
    <prism:category>on-line</prism:category>
    <prism:category>prediction</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2776008">
    <title>Comparative analysis of five protein-protein interaction corpora</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2776008</link>
    <description>&lt;i&gt;BMC Bioinformatics, Vol. 9, No. Suppl 3. (2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND:Growing interest in the application of natural language processing methods to biomedical text has led to an increasing number of corpora and methods targeting protein-protein interaction (PPI) extraction. However, there is no general consensus regarding PPI annotation and consequently resources are largely incompatible and methods are difficult to evaluate.RESULTS:We present the first comparative evaluation of the diverse PPI corpora, performing quantitative evaluation using two separate information extraction methods as well as detailed statistical and qualitative analyses of their properties. For the evaluation, we unify the corpus PPI annotations to a shared level of information, consisting of undirected, untyped binary interactions of non-static types with no identification of the words specifying the interaction, no negations, and no interaction certainty.We find that the F-score performance of a state-of-the-art PPI extraction method varies on average 19 percentage units and in some cases over 30 percentage units between the different evaluated corpora. The differences stemming from the choice of corpus can thus be substantially larger than differences between the performance of PPI extraction methods, which suggests definite limits on the ability to compare methods evaluated on different resources. We analyse a number of potential sources for these differences and identify factors explaining approximately half of the variance. We further suggest ways in which the difficulty of the PPI extraction tasks codified by different corpora can be determined to advance comparability. Our analysis also identifies points of agreement and disagreement in PPI corpus annotation that are rarely explicitly stated by the authors of the corpora.CONCLUSIONS:Our comparative analysis uncovers key similarities and differences between the diverse PPI corpora, thus taking an important step towards standardization. In the course of this study we have created a major practical contribution in converting the corpora into a shared format. The conversion software is freely available at http://mars.cs.utu.fi/PPICorpora.</description>
    <dc:title>Comparative analysis of five protein-protein interaction corpora</dc:title>

    <dc:creator>Sampo Pyysalo</dc:creator>
    <dc:creator>Antti Airola</dc:creator>
    <dc:creator>Juho Heimonen</dc:creator>
    <dc:creator>Jari Bjorne</dc:creator>
    <dc:creator>Filip Ginter</dc:creator>
    <dc:creator>Tapio Salakoski</dc:creator>
    <dc:identifier>doi:10.1186/1471-2105-9-S3-S6</dc:identifier>
    <dc:source>BMC Bioinformatics, Vol. 9, No. Suppl 3. (2008)</dc:source>
    <dc:date>2008-05-09T14:34:10-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>BMC Bioinformatics</prism:publicationName>
    <prism:volume>9</prism:volume>
    <prism:number>Suppl 3</prism:number>
    <prism:category>bionlp</prism:category>
    <prism:category>interaction</prism:category>
    <prism:category>protein-protein</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2670160">
    <title>Normalizing biomedical terms by minimizing ambiguity and variability</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2670160</link>
    <description>&lt;i&gt;BMC Bioinformatics, Vol. 9, No. Suppl 3. (2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND:One of the difficulties in mapping biomedical named entities, e.g. genes, proteins, chemicals and diseases, to their concept identifiers stems from the potential variability of the terms. Soft string matching is a possible solution to the problem, but its inherent heavy computational cost discourages its use when the dictionaries are large or when real time processing is required. A less computationally demanding approach is to normalize the terms by using heuristic rules, which enables us to look up a dictionary in a constant time regardless of its size. The development of good heuristic rules, however, requires extensive knowledge of the terminology in question and thus is the bottleneck of the normalization approach.RESULTS:We present a novel framework for discovering a list of normalization rules from a dictionary in a fully automated manner. The rules are discovered in such a way that they minimize the ambiguity and variability of the terms in the dictionary. We evaluated our algorithm using two large dictionaries: a human gene/protein name dictionary built from BioThesaurus and a disease name dictionary built from UMLS.CONCLUSIONS:The experimental results showed that automatically discovered rules can perform comparably to carefully crafted heuristic rules in term mapping tasks, and the computational overhead of rule application is small enough that a very fast implementation is possible. This work will help improve the performance of term-concept mapping tasks in biomedical information extraction especially when good normalization heuristics for the target terminology are not fully known.</description>
    <dc:title>Normalizing biomedical terms by minimizing ambiguity and variability</dc:title>

    <dc:creator>Yoshimasa Tsuruoka</dc:creator>
    <dc:creator>John Mcnaught</dc:creator>
    <dc:creator>Sophia Ananiadou</dc:creator>
    <dc:identifier>doi:10.1186/1471-2105-9-S3-S2</dc:identifier>
    <dc:source>BMC Bioinformatics, Vol. 9, No. Suppl 3. (2008)</dc:source>
    <dc:date>2008-04-14T17:56:30-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>BMC Bioinformatics</prism:publicationName>
    <prism:volume>9</prism:volume>
    <prism:number>Suppl 3</prism:number>
    <prism:category>bionlp</prism:category>
    <prism:category>gene</prism:category>
    <prism:category>normalization</prism:category>
    <prism:category>rules</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2775855">
    <title>BANNER: an executable survey of advances in biomedical named entity recognition.</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2775855</link>
    <description>&lt;i&gt;Pacific Symposium on Biocomputing. Pacific Symposium on Biocomputing (2008), pp. 652-663.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;There has been an increasing amount of research on biomedical named entity recognition, the most basic text extraction problem, resulting in significant progress by different research teams around the world. This has created a need for a freely-available, open source system implementing the advances described in the literature. In this paper we present BANNER, an open-source, executable survey of advances in biomedical named entity recognition, intended to serve as a benchmark for the field. BANNER is implemented in Java as a machine-learning system based on conditional random fields and includes a wide survey of the best techniques recently described in the literature. It is designed to maximize domain independence by not employing brittle semantic features or rule-based processing steps, and achieves significantly better performance than existing baseline systems. It is therefore useful to developers as an extensible NER implementation, to researchers as a standard for comparing innovative techniques, and to biologists requiring the ability to find novel entities in large amounts of text.</description>
    <dc:title>BANNER: an executable survey of advances in biomedical named entity recognition.</dc:title>

    <dc:creator>R Leaman</dc:creator>
    <dc:creator>G Gonzalez</dc:creator>
    <dc:source>Pacific Symposium on Biocomputing. Pacific Symposium on Biocomputing (2008), pp. 652-663.</dc:source>
    <dc:date>2008-05-09T13:25:09-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Pacific Symposium on Biocomputing. Pacific Symposium on Biocomputing</prism:publicationName>
    <prism:issn>1793-5091</prism:issn>
    <prism:startingPage>652</prism:startingPage>
    <prism:endingPage>663</prism:endingPage>
    <prism:category>bionlp</prism:category>
    <prism:category>crf</prism:category>
    <prism:category>entity</prism:category>
    <prism:category>gene</prism:category>
    <prism:category>name</prism:category>
    <prism:category>named</prism:category>
    <prism:category>ner</prism:category>
    <prism:category>recognition</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2765621">
    <title>Unsupervised Learning of Narrative Event Chains</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2765621</link>
    <description>&lt;i&gt;(2008)&lt;/i&gt;</description>
    <dc:title>Unsupervised Learning of Narrative Event Chains</dc:title>

    <dc:creator>Nathanael Chambers</dc:creator>
    <dc:creator>Dan Jurafsky</dc:creator>
    <dc:source>(2008)</dc:source>
    <dc:date>2008-05-07T12:14:02-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:category>learning</prism:category>
    <prism:category>unsupervised</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2697015">
    <title>Semi-Supervised Learning</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2697015</link>
    <description>&lt;i&gt;(2006)&lt;/i&gt;</description>
    <dc:title>Semi-Supervised Learning</dc:title>

    <dc:source>(2006)</dc:source>
    <dc:date>2008-04-21T16:04:15-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publisher>MIT Press</prism:publisher>
    <prism:category>learning</prism:category>
    <prism:category>machine</prism:category>
    <prism:category>semi-supervised</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/1185721">
    <title>Corrective feedback and persistent learning for information extraction</title>
    <link>http://www.citeulike.org/user/vlachmore/article/1185721</link>
    <description>&lt;i&gt;Artif. Intell., Vol. 170, No. 14. (October 2006), pp. 1101-1122.&lt;/i&gt;</description>
    <dc:title>Corrective feedback and persistent learning for information extraction</dc:title>

    <dc:creator>Aron Culotta</dc:creator>
    <dc:creator>Trausti Kristjansson</dc:creator>
    <dc:creator>Andrew Mccallum</dc:creator>
    <dc:creator>Paul Viola</dc:creator>
    <dc:identifier>doi:10.1016/j.artint.2006.08.001</dc:identifier>
    <dc:source>Artif. Intell., Vol. 170, No. 14. (October 2006), pp. 1101-1122.</dc:source>
    <dc:date>2007-03-25T01:13:08-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Artif. Intell.</prism:publicationName>
    <prism:issn>0004-3702</prism:issn>
    <prism:volume>170</prism:volume>
    <prism:number>14</prism:number>
    <prism:startingPage>1101</prism:startingPage>
    <prism:endingPage>1122</prism:endingPage>
    <prism:publisher>Elsevier Science Publishers Ltd.</prism:publisher>
    <prism:category>conditional</prism:category>
    <prism:category>extraction</prism:category>
    <prism:category>feedback</prism:category>
    <prism:category>fields</prism:category>
    <prism:category>information</prism:category>
    <prism:category>random</prism:category>
    <prism:category>user</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2674017">
    <title>Toward conditional models of identity uncertainty with application to proper noun coreference</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2674017</link>
    <description>&lt;i&gt;(2003)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Coreference analysis, also known as record linkage or identity uncertainty, is a difficult and important problem in natural language processing, databases, citation matching and many other tasks. This paper introduces several discriminative, conditionalprobability models for coreference analysis, all examples of undirected graphical models. Unlike many historical approaches to coreference, the models presented here are relational---they do not assume that pairwise coreference decisions ...</description>
    <dc:title>Toward conditional models of identity uncertainty with application to proper noun coreference</dc:title>

    <dc:creator>A Mccallum</dc:creator>
    <dc:creator>B Wellner</dc:creator>
    <dc:source>(2003)</dc:source>
    <dc:date>2008-04-15T16:38:49-00:00</dc:date>
    <prism:publicationYear>2003</prism:publicationYear>
    <prism:category>conditional</prism:category>
    <prism:category>coreference</prism:category>
    <prism:category>fields</prism:category>
    <prism:category>noun</prism:category>
    <prism:category>proper</prism:category>
    <prism:category>random</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2672890">
    <title>Natural Language Processing in aid of FlyBase curators</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2672890</link>
    <description>&lt;i&gt;BMC Bioinformatics, Vol. 9, No. 1. (2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;BACKGROUND:Despite increasing interest in applying Natural Language Processing (NLP) to biomedical text, whether this technology can facilitate tasks such as database curation remains unclear.RESULTS:PaperBrowser is the first NLP-powered interface that was developed under a user-centered approach to improve the way in which FlyBase curators navigate an article. In this paper, we first discuss how observing curators at work informed the design and evaluation of PaperBrowser. Then, we present how we appraise PaperBrowser's navigational functionalities in a user-based study using a text highlighting task and evaluation criteria of Human-Computer Interaction. Our results show that PaperBrowser reduces the amount of interactions between two highlighting events and therefore improves navigational efficiency by about 58% compared to the navigational mechanism that was previously available to the curators. Moreover, PaperBrowser is shown to provide curators with enhanced navigational utility by over 74% irrespective of the different ways in which they highlight text in the article.CONCLUSIONS:We show that state-of-the-art performance in certain NLP tasks such as Named Entity Recognition and Anaphora Resolution can be combined with the navigational functionalities of PaperBrowser to support curation quite successfully.</description>
    <dc:title>Natural Language Processing in aid of FlyBase curators</dc:title>

    <dc:creator>Nikiforos Karamanis</dc:creator>
    <dc:creator>Ruth Seal</dc:creator>
    <dc:creator>Ian Lewin</dc:creator>
    <dc:creator>Peter Mcquilton</dc:creator>
    <dc:creator>Andreas Vlachos</dc:creator>
    <dc:creator>Caroline Gasperin</dc:creator>
    <dc:creator>Rachel Drysdale</dc:creator>
    <dc:creator>Ted Briscoe</dc:creator>
    <dc:identifier>doi:10.1186/1471-2105-9-193</dc:identifier>
    <dc:source>BMC Bioinformatics, Vol. 9, No. 1. (2008)</dc:source>
    <dc:date>2008-04-15T11:11:07-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>BMC Bioinformatics</prism:publicationName>
    <prism:volume>9</prism:volume>
    <prism:number>1</prism:number>
    <prism:category>bionlp</prism:category>
    <prism:category>curation</prism:category>
    <prism:category>flyslip</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2658576">
    <title>Semi-Automated Named Entity Annotation</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2658576</link>
    <description>&lt;i&gt;(June 2007), pp. 53-56.&lt;/i&gt;</description>
    <dc:title>Semi-Automated Named Entity Annotation</dc:title>

    <dc:creator>Kuzman Ganchev</dc:creator>
    <dc:creator>Fernando Pereira</dc:creator>
    <dc:creator>Mark Mandel</dc:creator>
    <dc:creator>Steven Carroll</dc:creator>
    <dc:creator>Peter White</dc:creator>
    <dc:source>(June 2007), pp. 53-56.</dc:source>
    <dc:date>2008-04-11T18:23:31-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:startingPage>53</prism:startingPage>
    <prism:endingPage>56</prism:endingPage>
    <prism:publisher>Association for Computational Linguistics</prism:publisher>
    <prism:category>annotation</prism:category>
    <prism:category>cost</prism:category>
    <prism:category>entity</prism:category>
    <prism:category>experiments</prism:category>
    <prism:category>mira</prism:category>
    <prism:category>named</prism:category>
    <prism:category>recognition</prism:category>
    <prism:category>timed</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/819622">
    <title>Constructing biological knowledge-bases by extracting information from text sources</title>
    <link>http://www.citeulike.org/user/vlachmore/article/819622</link>
    <description>&lt;i&gt;(1999), pp. 77-86.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Recently, there has been much effort in making databases for molecular biology more accessible and interoperable. However, information in text form, such as MEDLINE records, remains a greatly underutilized source of biological information. We have begun a research effort aimed at automatically mapping information from text sources into structured representations, such as knowledge bases. Our approach to this task is to use machine-learning methods to induce routines for extracting facts from...</description>
    <dc:title>Constructing biological knowledge-bases by extracting information from text sources</dc:title>

    <dc:creator>M Craven</dc:creator>
    <dc:creator>J Kumlien</dc:creator>
    <dc:source>(1999), pp. 77-86.</dc:source>
    <dc:date>2006-08-28T08:52:56-00:00</dc:date>
    <prism:publicationYear>1999</prism:publicationYear>
    <prism:startingPage>77</prism:startingPage>
    <prism:endingPage>86</prism:endingPage>
    <prism:category>bionlp</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2637717">
    <title>Verb Class Discovery from Rich Syntactic Data</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2637717</link>
    <description>&lt;i&gt;Computational Linguistics and Intelligent Text Processing (2008), pp. 16-27.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Previous research has shown that syntactic features are the most informative features in automatic verb classification. We investigate their optimal characteristics by comparing a range of feature sets extracted from data where the proportion of verbal arguments and adjuncts is controlled. The data are obtained from different versions of valex [1] – a large scf lexicon for English which was acquired automatically from several corpora and the Web. We evaluate the feature sets thoroughly using four supervised classifiers and one unsupervised method. The best performing feature set includes rich syntactic information about both arguments and adjuncts of verbs. When combined with our best performing classifier (a novel Gaussian classifier), it yields the promising accuracy of 64.2% in classifying 204 verbs to 17 Levin (1993) classes. We discuss the impact of our results on the state-or-art and propose avenues for future work.</description>
    <dc:title>Verb Class Discovery from Rich Syntactic Data</dc:title>

    <dc:creator>Lin Sun</dc:creator>
    <dc:creator>Anna Korhonen</dc:creator>
    <dc:creator>Yuval Krymolowski</dc:creator>
    <dc:identifier>doi:10.1007/978-3-540-78135-6_2</dc:identifier>
    <dc:source>Computational Linguistics and Intelligent Text Processing (2008), pp. 16-27.</dc:source>
    <dc:date>2008-04-07T13:16:29-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Computational Linguistics and Intelligent Text Processing</prism:publicationName>
    <prism:startingPage>16</prism:startingPage>
    <prism:endingPage>27</prism:endingPage>
    <prism:category>classifier</prism:category>
    <prism:category>clustering</prism:category>
    <prism:category>frames</prism:category>
    <prism:category>gaussian</prism:category>
    <prism:category>semantic</prism:category>
    <prism:category>subcategorization</prism:category>
    <prism:category>verb</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/113955">
    <title>WordNet: An Electronic Lexical Database (Language, Speech, and Communication)</title>
    <link>http://www.citeulike.org/user/vlachmore/article/113955</link>
    <description>&lt;i&gt;(15 May 1998)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;with a preface by George Miller &#60;P&#62;WordNet, an electronic lexical database, is considered to be the most important resource available to researchers in computational linguistics, text analysis, and many related areas. Its design is inspired by current psycholinguistic and computational theories of human lexical memory. English nouns, verbs, adjectives, and adverbs are organized into synonym sets, each representing one underlying lexicalized concept. Different relations link the synonym sets. &#60;P&#62;The purpose of this volume is twofold. First, it discusses the design of WordNet and the theoretical motivations behind it. Second, it provides a survey of representative applications, including word sense identification, information retrieval, selectional preferences of verbs, and lexical chains. &#60;P&#62;Contributors: Reem Al-Halimi, Robert C. Berwick, J. F. M. Burg, Martin Chodorow, Christiane Fellbaum, Joachim Grabowski, Sanda Harabagiu, Marti A. Hearst, Graeme Hirst, Douglas A. Jones, Rick Kazman, Karen T. Kohl, Shari Landes, Claudia Leacock, George A. Miller, Katherine J. Miller, Dan Moldovan, Naoyuki Nomura, Uta Priss, Philip Resnik, David St-Onge, Randee Tengi, Reind P. van de Riet, Ellen Voorhees.</description>
    <dc:title>WordNet: An Electronic Lexical Database (Language, Speech, and Communication)</dc:title>

    <dc:source>(15 May 1998)</dc:source>
    <dc:date>2005-03-04T15:24:02-00:00</dc:date>
    <prism:publicationYear>1998</prism:publicationYear>
    <prism:publisher>The MIT Press</prism:publisher>
    <prism:category>wordnet</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/1153421">
    <title>WordNet: a lexical database for English</title>
    <link>http://www.citeulike.org/user/vlachmore/article/1153421</link>
    <description>&lt;i&gt;Commun. ACM, Vol. 38, No. 11. (November 1995), pp. 39-41.&lt;/i&gt;</description>
    <dc:title>WordNet: a lexical database for English</dc:title>

    <dc:creator>George Miller</dc:creator>
    <dc:identifier>doi:10.1145/219717.219748</dc:identifier>
    <dc:source>Commun. ACM, Vol. 38, No. 11. (November 1995), pp. 39-41.</dc:source>
    <dc:date>2007-03-11T06:40:46-00:00</dc:date>
    <prism:publicationYear>1995</prism:publicationYear>
    <prism:publicationName>Commun. ACM</prism:publicationName>
    <prism:issn>0001-0782</prism:issn>
    <prism:volume>38</prism:volume>
    <prism:number>11</prism:number>
    <prism:startingPage>39</prism:startingPage>
    <prism:endingPage>41</prism:endingPage>
    <prism:publisher>ACM Press</prism:publisher>
    <prism:category>wordnet</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/1304139">
    <title>Objective criteria for the evaluation of clustering methods</title>
    <link>http://www.citeulike.org/user/vlachmore/article/1304139</link>
    <description>&lt;i&gt;Journal of the American Statistical Association, Vol. 66 (1971), pp. 622-626.&lt;/i&gt;</description>
    <dc:title>Objective criteria for the evaluation of clustering methods</dc:title>

    <dc:creator>Wwilliam Rand</dc:creator>
    <dc:identifier>doi:10.2307/2284239</dc:identifier>
    <dc:source>Journal of the American Statistical Association, Vol. 66 (1971), pp. 622-626.</dc:source>
    <dc:date>2007-05-17T19:24:25-00:00</dc:date>
    <prism:publicationYear>1971</prism:publicationYear>
    <prism:publicationName>Journal of the American Statistical Association</prism:publicationName>
    <prism:volume>66</prism:volume>
    <prism:startingPage>622</prism:startingPage>
    <prism:endingPage>626</prism:endingPage>
    <prism:category>clustering</prism:category>
    <prism:category>evaluation</prism:category>
    <prism:category>index</prism:category>
    <prism:category>rand</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/590638">
    <title>Interpolating between Types and Tokens by Estimating Power-Law Generators</title>
    <link>http://www.citeulike.org/user/vlachmore/article/590638</link>
    <description>&lt;i&gt;Advances in Neural Information Processing Systems, Vol. 18 (2006)&lt;/i&gt;</description>
    <dc:title>Interpolating between Types and Tokens by Estimating Power-Law Generators</dc:title>

    <dc:creator>Sharon Goldwater</dc:creator>
    <dc:creator>Thomas Griffiths</dc:creator>
    <dc:creator>Mark Johnson</dc:creator>
    <dc:source>Advances in Neural Information Processing Systems, Vol. 18 (2006)</dc:source>
    <dc:date>2006-04-18T17:41:00-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Advances in Neural Information Processing Systems</prism:publicationName>
    <prism:volume>18</prism:volume>
    <prism:category>bayesian</prism:category>
    <prism:category>non-parametric</prism:category>
    <prism:category>pitman</prism:category>
    <prism:category>yor</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2520315">
    <title>A large-scale classification of English verbs</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2520315</link>
    <description>&lt;i&gt;Language Resources and Evaluation&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Abstract&#160;&#160;Lexical classifications have proved useful in supporting various natural language processing (NLP) tasks. The largest verb classification for English is Levin’s (1993) work which defines groupings of verbs based on syntactic and semantic properties. VerbNet (VN) (Kipper et&#160;al. 2000; Kipper-Schuler 2005)—an extensive computational verb lexicon for English—provides detailed syntactic-semantic descriptions of Levin classes. While the classes included are extensive enough for some NLP use, they are not comprehensive. Korhonen and Briscoe (2004) have proposed a significant extension of Levin’s classification which incorporates 57 novel classes for verbs not covered (comprehensively) by Levin. Korhonen and Ryant (unpublished) have recently proposed another extension including 53 additional classes. This article describes the integration of these two extensions into VN. The result is a comprehensive Levin-style classification for English verbs providing over 90% token coverage of the Proposition Bank data (Palmer et&#160;al. 2005) and thus can be highly useful for practical applications.</description>
    <dc:title>A large-scale classification of English verbs</dc:title>

    <dc:creator>Karin Kipper</dc:creator>
    <dc:creator>Anna Korhonen</dc:creator>
    <dc:creator>Neville Ryant</dc:creator>
    <dc:creator>Martha Palmer</dc:creator>
    <dc:identifier>doi:10.1007/s10579-007-9048-2</dc:identifier>
    <dc:source>Language Resources and Evaluation</dc:source>
    <dc:date>2008-03-12T13:47:21-00:00</dc:date>
    <prism:publicationName>Language Resources and Evaluation</prism:publicationName>
    <prism:category>classification</prism:category>
    <prism:category>semantic</prism:category>
    <prism:category>verb</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2515403">
    <title>Fast search for Dirichlet process mixture models</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2515403</link>
    <description>&lt;i&gt;(2007)&lt;/i&gt;</description>
    <dc:title>Fast search for Dirichlet process mixture models</dc:title>

    <dc:creator>Hal Daume</dc:creator>
    <dc:source>(2007)</dc:source>
    <dc:date>2008-03-11T15:49:06-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:category>dirichlet</prism:category>
    <prism:category>mixture</prism:category>
    <prism:category>models</prism:category>
    <prism:category>multinomials</prism:category>
    <prism:category>process</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2515369">
    <title>Identification of MCMC Samples for Clustering</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2515369</link>
    <description>&lt;i&gt;(2008)&lt;/i&gt;</description>
    <dc:title>Identification of MCMC Samples for Clustering</dc:title>

    <dc:creator>Kenichi Kurihara</dc:creator>
    <dc:creator>Tsuyoshi Murata</dc:creator>
    <dc:creator>Taisuke Sato</dc:creator>
    <dc:source>(2008)</dc:source>
    <dc:date>2008-03-11T15:42:00-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:category>average</prism:category>
    <prism:category>clustering</prism:category>
    <prism:category>mcmc</prism:category>
    <prism:category>spectral</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2504970">
    <title>Randomized Algorithms for Fast Bayesian Hierarchical Clustering</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2504970</link>
    <description>&lt;i&gt;&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We present two new algorithms for fast Bayesian Hierarchical Clustering on large data sets. Bayesian Hierarchical Clustering (BHC) [1] is a method for agglomerative hierarchical clustering based on evaluating marginal likelihoods of a probabilistic model. BHC has several advantages over traditional distancebased agglomerative clustering algorithms. It defines a probabilistic model of the data and uses Bayesian hypothesis testing to decide which merges are advantageous and to output the...</description>
    <dc:title>Randomized Algorithms for Fast Bayesian Hierarchical Clustering</dc:title>

    <dc:creator>Katherine Heller</dc:creator>
    <dc:creator>Zoubin Ghahramani</dc:creator>
    <dc:date>2008-03-11T00:09:42-00:00</dc:date>
    <prism:category>bayesian</prism:category>
    <prism:category>clustering</prism:category>
    <prism:category>hierarchical</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/1081834">
    <title>The Comlex Syntax Project</title>
    <link>http://www.citeulike.org/user/vlachmore/article/1081834</link>
    <description>&lt;i&gt;(1994), pp. 300-302.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We describe the design of Comlex Syntax, a computational lexicon providing detailed syntactic information for approximately 38,000 English headwords. We consider the types of errors which arise in creating such a lexicon, and how such errors can be measured and controlled. 1 Goal The goal of the Comlex Syntax project is to create a moderately-broad-coverage lexicon recording the syntactic features of English words for purposes of computational language analysis. This dictionary is being...</description>
    <dc:title>The Comlex Syntax Project</dc:title>

    <dc:creator>R Grishman</dc:creator>
    <dc:creator>C Macleod</dc:creator>
    <dc:creator>S Wolff</dc:creator>
    <dc:source>(1994), pp. 300-302.</dc:source>
    <dc:date>2007-02-01T09:48:24-00:00</dc:date>
    <prism:publicationYear>1994</prism:publicationYear>
    <prism:startingPage>300</prism:startingPage>
    <prism:endingPage>302</prism:endingPage>
    <prism:category>comlex</prism:category>
    <prism:category>lexicon</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2491840">
    <title>Automatic Extraction of Subcategorization from Corpora</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2491840</link>
    <description>&lt;i&gt;(1997)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We describe a novel technique and implemented system for constructing a subcategorization dictionary from textual corpora. Each dictionary entry encodes the relative frequency of occurrence of a comprehensive set of subcategorization classes for English. An initial experiment, on a sample of 14 verbs which exhibit multiple complementation patterns, demonstrates that the technique achieves accuracy comparable to previous approaches, which are all limited to a highly restricted set of...</description>
    <dc:title>Automatic Extraction of Subcategorization from Corpora</dc:title>

    <dc:creator>T Briscoe</dc:creator>
    <dc:creator>J Carroll</dc:creator>
    <dc:source>(1997)</dc:source>
    <dc:date>2008-03-09T02:14:49-00:00</dc:date>
    <prism:publicationYear>1997</prism:publicationYear>
    <prism:category>frame</prism:category>
    <prism:category>parsing</prism:category>
    <prism:category>rasp</prism:category>
    <prism:category>subcategorization</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2491574">
    <title>Using a probabilistic class-based lexicon for lexical ambiguity resolution</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2491574</link>
    <description>&lt;i&gt;(2000)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;This paper presents the use of probabilistic class-based lexica for disambiguation in target-word selection. Our method employs minimal but precise contextual information for disambiguation. That is, only information provided by the target-verb, enriched by the condensed information of a probabilistic class-based lexicon, is used. Induction of classes and fine-tuning to verbal arguments is done in an unsupervised manner by EM-based clustering techniques. The method shows promising results in an ...</description>
    <dc:title>Using a probabilistic class-based lexicon for lexical ambiguity resolution</dc:title>

    <dc:creator>D Prescher</dc:creator>
    <dc:creator>S Riezler</dc:creator>
    <dc:creator>M Rooth</dc:creator>
    <dc:source>(2000)</dc:source>
    <dc:date>2008-03-09T00:47:14-00:00</dc:date>
    <prism:publicationYear>2000</prism:publicationYear>
    <prism:category>amibguity</prism:category>
    <prism:category>disambiguation</prism:category>
    <prism:category>resolution</prism:category>
    <prism:category>sense</prism:category>
    <prism:category>word</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2491502">
    <title>Spectral Clustering for German Verbs</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2491502</link>
    <description>&lt;i&gt;&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We describe and evaluate the application of a spectral clustering technique (Ng et al., 2002) to the unsupervised clustering of German verbs. Previous work has shown that standard clustering techniques succeed in inducing semantic classes from purely syntactic verb subcategorisation information. But little is known about the behaviour of these techniques when applied to high-dimensional natural language data that probably violate the usual normal assumptions. Spectral clustering performs a...</description>
    <dc:title>Spectral Clustering for German Verbs</dc:title>

    <dc:creator>Chris Brew</dc:creator>
    <dc:creator>Sabine</dc:creator>
    <dc:date>2008-03-09T00:18:09-00:00</dc:date>
    <prism:category>clustering</prism:category>
    <prism:category>german</prism:category>
    <prism:category>semantic</prism:category>
    <prism:category>spectral</prism:category>
    <prism:category>spectral_clustering</prism:category>
    <prism:category>verb</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2491441">
    <title>Clustering polysemic subcategorization frame distributions semantically</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2491441</link>
    <description>&lt;i&gt;(2003)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Previous research has demonstrated the utility of clustering in inducing semantic verb classes from undisambiguated corpus data. We describe a new approach which involves clustering subcategorization frame (SCF) distributions using the Information Bottleneck and nearest neighbour methods. In contrast to previous work, we particularly focus on clustering polysemic verbs. A novel evaluation scheme is proposed which accounts for the effect of polysemy on the clusters, offering us a...</description>
    <dc:title>Clustering polysemic subcategorization frame distributions semantically</dc:title>

    <dc:creator>A Korhonen</dc:creator>
    <dc:creator>Y Krymolowski</dc:creator>
    <dc:creator>Z Marx</dc:creator>
    <dc:source>(2003)</dc:source>
    <dc:date>2008-03-08T23:46:47-00:00</dc:date>
    <prism:publicationYear>2003</prism:publicationYear>
    <prism:category>clustering</prism:category>
    <prism:category>frames</prism:category>
    <prism:category>polysemous</prism:category>
    <prism:category>semantic</prism:category>
    <prism:category>subcategorization</prism:category>
    <prism:category>verb</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2354608">
    <title>All of Nonparametric Statistics (Springer Texts in Statistics)</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2354608</link>
    <description>&lt;i&gt;(22 May 2007)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;&#60;P&#62;The goal of this text is to provide the reader with a single book where they can find a brief account of many, modern topics in nonparametric inference. The book is aimed at Master's level or Ph.D. level students in statistics, computer science, and engineering. It is also suitable for researchers who want to get up to speed quickly on modern nonparametric methods.&#60;/P&#62; &#60;P&#62;This text covers a wide range of topics including: the bootstrap, the nonparametric delta method, nonparametric regression, density estimation, orthogonal function methods, minimax estimation, nonparametric confidence sets, and wavelets. The book has a mixture of methods and theory.&#60;/P&#62; &#60;P&#62;From the reviews:&#60;/P&#62; &#60;P&#62;&#34;...The book is excellent.&#34; (Short Book Reviews of the ISI, June 2006)&#60;/P&#62; &#60;P&#62;&#34;Now we have All of Nonparametric Statistics . the writing is excellent and the author is to be congratulated on the clarity achieved. the book is excellent.&#34; (N.R. Draper, Short Book Reviews, Vol. 26 (1), 2006)&#60;/P&#62; &#60;P&#62;&#34;Overall, I enjoyed reading this book very much. I like Wasserman's intuitive explanations and careful insights into why one path or approach is taken over another. Most of all, I am impressed with the wealth of information on the subject of asymptotic nonparametric inferences.&#34; (Stergios B. Fotopoulos for Technometrics, Vol. 49, No. 1., February 2007)&#60;/P&#62;</description>
    <dc:title>All of Nonparametric Statistics (Springer Texts in Statistics)</dc:title>

    <dc:creator>Larry Wasserman</dc:creator>
    <dc:source>(22 May 2007)</dc:source>
    <dc:date>2008-02-08T19:48:04-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:publisher>Springer</prism:publisher>
    <prism:category>bayesian</prism:category>
    <prism:category>non-parametric</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/1983303">
    <title>A Nonparametric Bayesian Approach to Modeling Overlapping Clusters</title>
    <link>http://www.citeulike.org/user/vlachmore/article/1983303</link>
    <description>&lt;i&gt;(2007)&lt;/i&gt;</description>
    <dc:title>A Nonparametric Bayesian Approach to Modeling Overlapping Clusters</dc:title>

    <dc:creator>KA Heller</dc:creator>
    <dc:creator>Z Ghahramani</dc:creator>
    <dc:source>(2007)</dc:source>
    <dc:date>2007-11-26T03:17:47-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:category>buffet</prism:category>
    <prism:category>clustering</prism:category>
    <prism:category>ibp</prism:category>
    <prism:category>indian</prism:category>
    <prism:category>mixture</prism:category>
    <prism:category>model</prism:category>
    <prism:category>overlap</prism:category>
    <prism:category>process</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/635668">
    <title>Sharing Clusters among Related Groups: Hierarchical Dirichlet Processes</title>
    <link>http://www.citeulike.org/user/vlachmore/article/635668</link>
    <description>&lt;i&gt;Advances in Neural Information Processing Systems 17 (2005), pp. 1385-1392.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We consider problems involving groups of data, where each observation within a group is a draw from a mixture model, and where it is desirable to share mixture components between groups. We assume that the number of mixture components is unknown a priori and is to be inferred from the data. In this setting it is natural to consider sets of Dirichlet processes, one for each group, where the well-known clustering property of the Dirichlet process provides a nonparametric prior for the number of mixture components within each group. Given our desire to tie the mixture models in the various groups, we consider a hierarchical model, specifically one in which the base measure for the child Dirichlet processes is itself distributed according to a Dirichlet process. Such a base measure being discrete, the child Dirichlet processes necessarily share atoms. Thus, as desired, the mixture models in the different groups necessarily share mixture components. We discuss representations of hierarchical Dirichlet processes in terms of a stick-breaking process, and a generalization of the Chinese restaurant process that we refer to as the “Chinese restaurant franchise.” We present Markov chain Monte Carlo algorithms for posterior inference in hierarchical Dirichlet process mixtures, and describe applications to problems in information retrieval and text modelling.</description>
    <dc:title>Sharing Clusters among Related Groups: Hierarchical Dirichlet Processes</dc:title>

    <dc:creator>Yee Teh</dc:creator>
    <dc:creator>Michael Jordan</dc:creator>
    <dc:creator>Matthew Beal</dc:creator>
    <dc:creator>David Blei</dc:creator>
    <dc:source>Advances in Neural Information Processing Systems 17 (2005), pp. 1385-1392.</dc:source>
    <dc:date>2006-05-15T13:16:25-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Advances in Neural Information Processing Systems 17</prism:publicationName>
    <prism:startingPage>1385</prism:startingPage>
    <prism:endingPage>1392</prism:endingPage>
    <prism:publisher>MIT Press</prism:publisher>
    <prism:category>bayesian</prism:category>
    <prism:category>clustering</prism:category>
    <prism:category>dirichlet</prism:category>
    <prism:category>hierarchical</prism:category>
    <prism:category>process</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2465524">
    <title>How many clusters?</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2465524</link>
    <description>&lt;i&gt;Bayesian Analysis, Vol. 3, No. 1. (2008), pp. 101-120.&lt;/i&gt;</description>
    <dc:title>How many clusters?</dc:title>

    <dc:creator>Peter Mccullagh</dc:creator>
    <dc:creator>J Yang</dc:creator>
    <dc:source>Bayesian Analysis, Vol. 3, No. 1. (2008), pp. 101-120.</dc:source>
    <dc:date>2008-03-04T16:33:05-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Bayesian Analysis</prism:publicationName>
    <prism:volume>3</prism:volume>
    <prism:number>1</prism:number>
    <prism:startingPage>101</prism:startingPage>
    <prism:endingPage>120</prism:endingPage>
    <prism:category>clustering</prism:category>
    <prism:category>dirichlet</prism:category>
    <prism:category>process</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2449590">
    <title>Maximum Likelihood and the Information Bottleneck</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2449590</link>
    <description>&lt;i&gt;(2003)&lt;/i&gt;</description>
    <dc:title>Maximum Likelihood and the Information Bottleneck</dc:title>

    <dc:creator>N Slonim</dc:creator>
    <dc:creator>Y Weiss</dc:creator>
    <dc:source>(2003)</dc:source>
    <dc:date>2008-02-29T23:20:32-00:00</dc:date>
    <prism:publicationYear>2003</prism:publicationYear>
    <prism:category>bottleneck</prism:category>
    <prism:category>information</prism:category>
    <prism:category>likelihood</prism:category>
    <prism:category>maximum</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2447750">
    <title>Multiple Kernel Learning for Speaker Verification</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2447750</link>
    <description>&lt;i&gt;(2008)&lt;/i&gt;</description>
    <dc:title>Multiple Kernel Learning for Speaker Verification</dc:title>

    <dc:creator>Chris Longworth</dc:creator>
    <dc:creator>Mark Gales</dc:creator>
    <dc:source>(2008)</dc:source>
    <dc:date>2008-02-29T14:02:00-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:category>combination</prism:category>
    <prism:category>kernel</prism:category>
    <prism:category>machines</prism:category>
    <prism:category>speech</prism:category>
    <prism:category>support</prism:category>
    <prism:category>svms</prism:category>
    <prism:category>vector</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2447739">
    <title>Derivative and Parametric Kernels for Speaker Verification</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2447739</link>
    <description>&lt;i&gt;(2007)&lt;/i&gt;</description>
    <dc:title>Derivative and Parametric Kernels for Speaker Verification</dc:title>

    <dc:creator>Chris Longworth</dc:creator>
    <dc:creator>Mark Gales</dc:creator>
    <dc:source>(2007)</dc:source>
    <dc:date>2008-02-29T13:56:52-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:category>combination</prism:category>
    <prism:category>kernels</prism:category>
    <prism:category>machines</prism:category>
    <prism:category>speech</prism:category>
    <prism:category>support</prism:category>
    <prism:category>svms</prism:category>
    <prism:category>vector</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/vlachmore/article/2394375">
    <title>An Information-Theoretic External Cluster-Validity Measure</title>
    <link>http://www.citeulike.org/user/vlachmore/article/2394375</link>
    <description>&lt;i&gt;&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;In this paper we propose a measure of similarity/association between two partitions of a set of objects. Our motivation is the desire to use the measure to characterize the quality or accuracy of clustering algorithms by somehow comparing the clusters they produce with &#34;ground truth&#34; consisting of classes assigned to the patterns by manual means or some other means in whose veracity there is confidence. Such measures are referred to as &#34;external&#34;. Our measure also allows clusterings with...</description>
    <dc:title>An Information-Theoretic External Cluster-Validity Measure</dc:title>

    <dc:creator>B Dom</dc:creator>
    <dc:date>2008-02-18T13:45:39-00:00</dc:date>
    <prism:category>clustering</prism:category>
    <prism:category>evaluation</prism:category>
</item>



</rdf:RDF>

