<?xml version="1.0" encoding="UTF-8"?>

<rdf:RDF
   xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
   xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#"
   xmlns="http://purl.org/rss/1.0/"
   xmlns:dc="http://purl.org/dc/elements/1.1/"
   xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/"
   xmlns:dcterms="http://purl.org/dc/terms/"

>
<channel rdf:about="http://www.citeulike.org/about">
<pubDate>Thu, 07 Aug 2008 21:53:43 BST</pubDate>


	<title>CiteULike: briordan's machine-learning</title>
	<description>CiteULike: briordan's machine-learning</description>


	<link>http://www.citeulike.org/user/briordan/tag/machine-learning</link>
	<dc:publisher>CiteULike.org</dc:publisher>
	<dc:language>en-gb</dc:language>
	<dc:rights>Copyright &#169; 2004-2008 citeulike.org</dc:rights>
	<items>
    <rdf:Seq>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2927808"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2899719"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2873816"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2860212"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2854511"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2853489"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/1823831"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2842511"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2835425"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2817924"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2811430"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2796096"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2796093"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2796089"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2631432"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2624700"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/1245563"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2553392"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2537928"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2537904"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2537897"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2537891"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2462930"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2462923"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2362997"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2355325"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2321812"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/312476"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2198867"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2192875"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2192865"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2186656"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2186649"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2186645"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2186641"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2186636"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2178376"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2069894"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2134463"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/1940101"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2126067"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2113835"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2113349"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2113337"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/2101496"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/1770144"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/briordan/article/1711091"/>

	</rdf:Seq>
	</items>
	</channel>


<item rdf:about="http://www.citeulike.org/user/briordan/article/2927808">
    <title>Robustly Estimating the Flow Direction of Information in Complex Physical Systems</title>
    <link>http://www.citeulike.org/user/briordan/article/2927808</link>
    <description>&lt;i&gt;Physical Review Letters, Vol. 100, No. 23. (2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We propose a new measure (phase-slope index) to estimate the direction of information flux in multivariate time series. This measure (a)&#160;is insensitive to mixtures of independent sources, (b)&#160;gives meaningful results even if the phase spectrum is not linear, and (c)&#160;properly weights contributions from different frequencies. These properties are shown in extended simulations and contrasted to Granger causality which yields highly significant false detections for mixtures of independent sources. An application to electroencephalography data (eyes-closed condition) reveals a clear front-to-back information flow.</description>
    <dc:title>Robustly Estimating the Flow Direction of Information in Complex Physical Systems</dc:title>

    <dc:creator>Guido Nolte</dc:creator>
    <dc:creator>Andreas Ziehe</dc:creator>
    <dc:creator>Vadim Nikulin</dc:creator>
    <dc:creator>Alois Schl&#246;gl</dc:creator>
    <dc:creator>Nicole Kr&#228;mer</dc:creator>
    <dc:creator>Tom Brismar</dc:creator>
    <dc:creator>Klaus M&#252;ller</dc:creator>
    <dc:identifier>doi:10.1103/PhysRevLett.100.234101</dc:identifier>
    <dc:source>Physical Review Letters, Vol. 100, No. 23. (2008)</dc:source>
    <dc:date>2008-06-26T00:26:34-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Physical Review Letters</prism:publicationName>
    <prism:volume>100</prism:volume>
    <prism:number>23</prism:number>
    <prism:publisher>APS</prism:publisher>
    <prism:category>machine-learning</prism:category>
    <prism:category>methods</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2899719">
    <title>Mathematical foundations behind Latent Semantic Analysis</title>
    <link>http://www.citeulike.org/user/briordan/article/2899719</link>
    <description>&lt;i&gt;(2007), pp. 35-55.&lt;/i&gt;</description>
    <dc:title>Mathematical foundations behind Latent Semantic Analysis</dc:title>

    <dc:creator>Dian Martin</dc:creator>
    <dc:creator>Michael Berry</dc:creator>
    <dc:source>(2007), pp. 35-55.</dc:source>
    <dc:date>2008-06-16T20:06:37-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:startingPage>35</prism:startingPage>
    <prism:endingPage>55</prism:endingPage>
    <prism:publisher>Lawrence Erlbaum Associates</prism:publisher>
    <prism:category>distributional-similarity</prism:category>
    <prism:category>lsa</prism:category>
    <prism:category>machine-learning</prism:category>
    <prism:category>models</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2873816">
    <title>An Efficient, Probabilistically Sound Algorithm for Segmentation and Word Discovery</title>
    <link>http://www.citeulike.org/user/briordan/article/2873816</link>
    <description>&lt;i&gt;Machine Learning, Vol. 34, No. 1. (1 February 1999), pp. 71-105.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;This paper presents a model-based, unsupervised algorithm for recovering word boundaries in a natural-language text from which they have been deleted. The algorithm is derived from a probability model of the source that generated the text. The fundamental structure of the model is specified abstractly so that the detailed component models of phonology, word-order, and word frequency can be replaced in a modular fashion. The model yields a language-independent, prior probability distribution on all possible sequences of all possible words over a given alphabet, based on the assumption that the input was generated by concatenating words from a fixed but unknown lexicon. The model is unusual in that it treats the generation of a complete corpus, regardless of length, as a single event in the probability space. Accordingly, the algorithm does not estimate a probability distribution on words; instead, it attempts to calculate the prior probabilities of various word sequences that could underlie the observed text. Experiments on phonemic transcripts of spontaneous speech by parents to young children suggest that our algorithm is more effective than other proposed algorithms, at least when utterance boundaries are given and the text includes a substantial number of short utterances.</description>
    <dc:title>An Efficient, Probabilistically Sound Algorithm for Segmentation and Word Discovery</dc:title>

    <dc:creator>Michael Brent</dc:creator>
    <dc:identifier>doi:10.1023/A:1007541817488</dc:identifier>
    <dc:source>Machine Learning, Vol. 34, No. 1. (1 February 1999), pp. 71-105.</dc:source>
    <dc:date>2008-06-08T18:10:36-00:00</dc:date>
    <prism:publicationYear>1999</prism:publicationYear>
    <prism:publicationName>Machine Learning</prism:publicationName>
    <prism:volume>34</prism:volume>
    <prism:number>1</prism:number>
    <prism:startingPage>71</prism:startingPage>
    <prism:endingPage>105</prism:endingPage>
    <prism:category>bayesian</prism:category>
    <prism:category>cross-situational</prism:category>
    <prism:category>machine-learning</prism:category>
    <prism:category>models</prism:category>
    <prism:category>statistical-learning</prism:category>
    <prism:category>word-meaning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2860212">
    <title>Bayesian Nonparametric Modeling and Data Analysis: An Introduction</title>
    <link>http://www.citeulike.org/user/briordan/article/2860212</link>
    <description>&lt;i&gt;(2005)&lt;/i&gt;</description>
    <dc:title>Bayesian Nonparametric Modeling and Data Analysis: An Introduction</dc:title>

    <dc:creator>Timothy Hanson</dc:creator>
    <dc:creator>Adam Branscum</dc:creator>
    <dc:creator>Wesley Johnson</dc:creator>
    <dc:source>(2005)</dc:source>
    <dc:date>2008-06-04T02:45:54-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publisher>Elsevier</prism:publisher>
    <prism:category>bayesian</prism:category>
    <prism:category>handbook</prism:category>
    <prism:category>machine-learning</prism:category>
    <prism:category>textbook</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2854511">
    <title>Towards effective document clustering: A constrained K-means based approach</title>
    <link>http://www.citeulike.org/user/briordan/article/2854511</link>
    <description>&lt;i&gt;Information Processing &#38; Management, Vol. 44, No. 4. (July 2008), pp. 1397-1409.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Document clustering is an important tool for document collection organization and browsing. In real applications, some limited knowledge about cluster membership of a small number of documents is often available, such as some pairs of documents belonging to the same cluster. This kind of prior knowledge can be served as constraints for the clustering process. We integrate the constraints into the trace formulation of the sum of square Euclidean distance function of K-means. Then,the combined criterion function is transformed into trace maximization, which is further optimized by eigen-decomposition. Our experimental evaluation shows that the proposed semi-supervised clustering method can achieve better performance, compared to three existing methods.</description>
    <dc:title>Towards effective document clustering: A constrained K-means based approach</dc:title>

    <dc:creator>Guobiao Hu</dc:creator>
    <dc:creator>Shuigeng Zhou</dc:creator>
    <dc:creator>Jihong Guan</dc:creator>
    <dc:creator>Xiaohua Hu</dc:creator>
    <dc:identifier>doi:10.1016/j.ipm.2008.03.001</dc:identifier>
    <dc:source>Information Processing &#38; Management, Vol. 44, No. 4. (July 2008), pp. 1397-1409.</dc:source>
    <dc:date>2008-06-01T11:34:38-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Information Processing &#38; Management</prism:publicationName>
    <prism:volume>44</prism:volume>
    <prism:number>4</prism:number>
    <prism:startingPage>1397</prism:startingPage>
    <prism:endingPage>1409</prism:endingPage>
    <prism:category>clustering</prism:category>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2853489">
    <title>A Nonparametric Bayesian Approach to Modeling Overlapping Clusters</title>
    <link>http://www.citeulike.org/user/briordan/article/2853489</link>
    <description>&lt;i&gt;(2007)&lt;/i&gt;</description>
    <dc:title>A Nonparametric Bayesian Approach to Modeling Overlapping Clusters</dc:title>

    <dc:creator>KA Heller</dc:creator>
    <dc:creator>Z Ghahramani</dc:creator>
    <dc:source>(2007)</dc:source>
    <dc:date>2008-05-31T17:43:44-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/1823831">
    <title>Very sparse random projections</title>
    <link>http://www.citeulike.org/user/briordan/article/1823831</link>
    <description>&lt;i&gt;(2006), pp. 287-296.&lt;/i&gt;</description>
    <dc:title>Very sparse random projections</dc:title>

    <dc:creator>Ping Li</dc:creator>
    <dc:creator>Trevor Hastie</dc:creator>
    <dc:creator>Kenneth Church</dc:creator>
    <dc:identifier>doi:10.1145/1150402.1150436</dc:identifier>
    <dc:source>(2006), pp. 287-296.</dc:source>
    <dc:date>2007-10-26T06:10:14-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:startingPage>287</prism:startingPage>
    <prism:endingPage>296</prism:endingPage>
    <prism:publisher>ACM Press</prism:publisher>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2842511">
    <title>Evaluation of Hierarchical Clustering Algorithms for Document Datasets</title>
    <link>http://www.citeulike.org/user/briordan/article/2842511</link>
    <description>&lt;i&gt;(2002), pp. 515-524.&lt;/i&gt;</description>
    <dc:title>Evaluation of Hierarchical Clustering Algorithms for Document Datasets</dc:title>

    <dc:creator>Ying Zhao</dc:creator>
    <dc:creator>George Karypis</dc:creator>
    <dc:source>(2002), pp. 515-524.</dc:source>
    <dc:date>2008-05-28T18:47:20-00:00</dc:date>
    <prism:publicationYear>2002</prism:publicationYear>
    <prism:startingPage>515</prism:startingPage>
    <prism:endingPage>524</prism:endingPage>
    <prism:category>computational-linguistics</prism:category>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2835425">
    <title>Derivative dynamic time warping</title>
    <link>http://www.citeulike.org/user/briordan/article/2835425</link>
    <description>&lt;i&gt;(2001)&lt;/i&gt;</description>
    <dc:title>Derivative dynamic time warping</dc:title>

    <dc:creator>Eamonn Keogh</dc:creator>
    <dc:creator>Michael Pazzani</dc:creator>
    <dc:source>(2001)</dc:source>
    <dc:date>2008-05-26T18:35:45-00:00</dc:date>
    <prism:publicationYear>2001</prism:publicationYear>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2817924">
    <title>Wavelet Methods in Statistics with R</title>
    <link>http://www.citeulike.org/user/briordan/article/2817924</link>
    <description>&lt;i&gt;(2008)&lt;/i&gt;</description>
    <dc:title>Wavelet Methods in Statistics with R</dc:title>

    <dc:creator>GP Nason</dc:creator>
    <dc:source>(2008)</dc:source>
    <dc:date>2008-05-20T23:01:13-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publisher>Springer</prism:publisher>
    <prism:category>machine-learning</prism:category>
    <prism:category>textbook</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2811430">
    <title>Discovering Knowledge in Data: An Introduction to Data Mining</title>
    <link>http://www.citeulike.org/user/briordan/article/2811430</link>
    <description>&lt;i&gt;(2005)&lt;/i&gt;</description>
    <dc:title>Discovering Knowledge in Data: An Introduction to Data Mining</dc:title>

    <dc:creator>Daniel Larose</dc:creator>
    <dc:source>(2005)</dc:source>
    <dc:date>2008-05-19T02:01:24-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publisher>Wiley</prism:publisher>
    <prism:category>machine-learning</prism:category>
    <prism:category>textbook</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2796096">
    <title>Multimodal Semantic-Associative Collateral Labelling and Indexing of Still Images</title>
    <link>http://www.citeulike.org/user/briordan/article/2796096</link>
    <description>&lt;i&gt;&lt;/i&gt;</description>
    <dc:title>Multimodal Semantic-Associative Collateral Labelling and Indexing of Still Images</dc:title>

    <dc:creator>Meng Zhu</dc:creator>
    <dc:creator>A Badii</dc:creator>
    <dc:date>2008-05-13T20:51:05-00:00</dc:date>
    <prism:category>machine-learning</prism:category>
    <prism:category>multimodal-processing</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2796093">
    <title>Automated vocabulary acquisition and interpretation in multimodal conversational systems</title>
    <link>http://www.citeulike.org/user/briordan/article/2796093</link>
    <description>&lt;i&gt;&lt;/i&gt;</description>
    <dc:title>Automated vocabulary acquisition and interpretation in multimodal conversational systems</dc:title>

    <dc:creator>Yi Liu</dc:creator>
    <dc:creator>Joyce Chai</dc:creator>
    <dc:creator>Rong Jin</dc:creator>
    <dc:date>2008-05-13T20:47:17-00:00</dc:date>
    <prism:category>machine-learning</prism:category>
    <prism:category>multimodal-processing</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2796089">
    <title>A multimodal learning interface for word acquistion</title>
    <link>http://www.citeulike.org/user/briordan/article/2796089</link>
    <description>&lt;i&gt;&lt;/i&gt;</description>
    <dc:title>A multimodal learning interface for word acquistion</dc:title>

    <dc:creator>Dana Ballard</dc:creator>
    <dc:creator>Chen Yu</dc:creator>
    <dc:date>2008-05-13T20:44:56-00:00</dc:date>
    <prism:category>machine-learning</prism:category>
    <prism:category>multimodal-processing</prism:category>
    <prism:category>word-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2631432">
    <title>Generalization and similarity in exemplar models of categorization: Insights from machine learning</title>
    <link>http://www.citeulike.org/user/briordan/article/2631432</link>
    <description>&lt;i&gt;Psychonomic Bulletin &#38; Review, Vol. 15, No. 2. (April 2008), pp. 256-271.&lt;/i&gt;</description>
    <dc:title>Generalization and similarity in exemplar models of categorization: Insights from machine learning</dc:title>

    <dc:creator>Jakel</dc:creator>
    <dc:creator>Frank</dc:creator>
    <dc:creator>Scholkopf</dc:creator>
    <dc:creator>Bernhard</dc:creator>
    <dc:creator>Wichmann</dc:creator>
    <dc:creator>A Felix</dc:creator>
    <dc:identifier>doi:10.3758/PBR.15.2.256</dc:identifier>
    <dc:source>Psychonomic Bulletin &#38; Review, Vol. 15, No. 2. (April 2008), pp. 256-271.</dc:source>
    <dc:date>2008-04-05T05:38:09-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Psychonomic Bulletin &#38; Review</prism:publicationName>
    <prism:issn>1069-9384</prism:issn>
    <prism:volume>15</prism:volume>
    <prism:number>2</prism:number>
    <prism:startingPage>256</prism:startingPage>
    <prism:endingPage>271</prism:endingPage>
    <prism:publisher>Psychonomic Society Publications</prism:publisher>
    <prism:category>category-learning</prism:category>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2624700">
    <title>Text Clustering with Feature Selection by Using Statistical Data</title>
    <link>http://www.citeulike.org/user/briordan/article/2624700</link>
    <description>&lt;i&gt;Knowledge and Data Engineering, IEEE Transactions on, Vol. 20, No. 5. (2008), pp. 641-652.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Feature selection is an important method for improving the efficiency and accuracy of text categorization algorithms by removing redundant and irrelevant terms from the corpus. In this paper, we propose a new supervised feature selection method, named CHIR, which is based on the Chi-square statistic and new statistical data that can measure the positive term-category dependency. We also propose a new text clustering algorithm TCFS, which stands for Text Clustering with Feature Selection. TCFS can incorporate CHIR to identify relevant features (i.e., terms) iteratively, and the clustering becomes a learning process. We compared TCFS and the k-means clustering algorithm in combination with different feature selection methods for various real data sets. Our experimental results show that TCFS with CHIR has better clustering accuracy in terms of the F-measure and the purity.</description>
    <dc:title>Text Clustering with Feature Selection by Using Statistical Data</dc:title>

    <dc:creator>Yanjun Li</dc:creator>
    <dc:creator>Congnan Luo</dc:creator>
    <dc:creator>Soon Chung</dc:creator>
    <dc:identifier>doi:10.1109/TKDE.2007.190740</dc:identifier>
    <dc:source>Knowledge and Data Engineering, IEEE Transactions on, Vol. 20, No. 5. (2008), pp. 641-652.</dc:source>
    <dc:date>2008-04-03T00:25:55-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Knowledge and Data Engineering, IEEE Transactions on</prism:publicationName>
    <prism:volume>20</prism:volume>
    <prism:number>5</prism:number>
    <prism:startingPage>641</prism:startingPage>
    <prism:endingPage>652</prism:endingPage>
    <prism:category>computational-linguistics</prism:category>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/1245563">
    <title>Discovering Significant Patterns</title>
    <link>http://www.citeulike.org/user/briordan/article/1245563</link>
    <description>&lt;i&gt;Machine Learning&lt;/i&gt;</description>
    <dc:title>Discovering Significant Patterns</dc:title>

    <dc:creator>Geoffrey Webb</dc:creator>
    <dc:identifier>doi:10.1007/s10994-007-5006-x</dc:identifier>
    <dc:source>Machine Learning</dc:source>
    <dc:date>2007-04-23T14:19:19-00:00</dc:date>
    <prism:publicationName>Machine Learning</prism:publicationName>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2553392">
    <title>The Text Mining Handbook: Advanced Approaches to Analyzing Unstructured Data</title>
    <link>http://www.citeulike.org/user/briordan/article/2553392</link>
    <description>&lt;i&gt;(2007)&lt;/i&gt;</description>
    <dc:title>The Text Mining Handbook: Advanced Approaches to Analyzing Unstructured Data</dc:title>

    <dc:creator>Ronen Feldman</dc:creator>
    <dc:creator>James Sanger</dc:creator>
    <dc:source>(2007)</dc:source>
    <dc:date>2008-03-19T00:45:51-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:publisher>Cambridge University Press</prism:publisher>
    <prism:category>computational-linguistics</prism:category>
    <prism:category>machine-learning</prism:category>
    <prism:category>textbook</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2537928">
    <title>Hierarchical learning strategy in semantic relation extraction</title>
    <link>http://www.citeulike.org/user/briordan/article/2537928</link>
    <description>&lt;i&gt;Information Processing &#38; Management, Vol. 44, No. 3. (May 2008), pp. 1008-1021.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;This paper proposes a novel hierarchical learning strategy to deal with the data sparseness problem in semantic relation extraction by modeling the commonality among related classes. For each class in the hierarchy either manually predefined or automatically clustered, a discriminative function is determined in a top-down way. As the upper-level class normally has much more positive training examples than the lower-level class, the corresponding discriminative function can be determined more reliably and guide the discriminative function learning in the lower-level one more effectively, which otherwise might suffer from limited training data. In this paper, two classifier learning approaches, i.e. the simple perceptron algorithm and the state-of-the-art Support Vector Machines, are applied using the hierarchical learning strategy. Moreover, several kinds of class hierarchies either manually predefined or automatically clustered are explored and compared. Evaluation on the ACE RDC 2003 and 2004 corpora shows that the hierarchical learning strategy much improves the performance on least- and medium-frequent relations.</description>
    <dc:title>Hierarchical learning strategy in semantic relation extraction</dc:title>

    <dc:creator>Guodong Zhou</dc:creator>
    <dc:creator>Min Zhang</dc:creator>
    <dc:creator>Donghong Ji</dc:creator>
    <dc:creator>Qiaoming Zhu</dc:creator>
    <dc:identifier>doi:10.1016/j.ipm.2007.07.007</dc:identifier>
    <dc:source>Information Processing &#38; Management, Vol. 44, No. 3. (May 2008), pp. 1008-1021.</dc:source>
    <dc:date>2008-03-15T22:13:04-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Information Processing &#38; Management</prism:publicationName>
    <prism:volume>44</prism:volume>
    <prism:number>3</prism:number>
    <prism:startingPage>1008</prism:startingPage>
    <prism:endingPage>1021</prism:endingPage>
    <prism:category>computational-linguistics</prism:category>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2537904">
    <title>Modeling a flexible representation machinery of human concept learning</title>
    <link>http://www.citeulike.org/user/briordan/article/2537904</link>
    <description>&lt;i&gt;Neural Networks, Vol. 21, No. 2-3. ( 2008), pp. 289-302.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;It is widely acknowledged that categorically organized abstract knowledge plays a significant role in high-order human cognition. Yet, there are many unknown issues about the nature of how categories are internally represented in our mind. Traditionally, it has been considered that there is a single innate internal representation system for categorical knowledge, such as Exemplars, Prototypes, or Rules. However, results of recent empirical and computational studies collectively suggest that the human internal representation system is apparently capable of exhibiting behaviors consistent with various types of internal representation schemes. We, then, hypothesized that humans' representational system as a dynamic mechanism, capable of selecting a representation scheme that meets situational characteristics, including complexities of category structure. The present paper introduces a framework for a cognitive model that integrates robust and flexible internal representation machinery. Three simulation studies were conducted. The results showed that SUPERSET, our new model, successfully exhibited cognitive behaviors that are consistent with three main theories of the human internal representation system. Furthermore, a simulation study on social cognitive behaviors showed that the model was capable of acquiring knowledge with high commonality, even for a category structure with numerous valid conceptualizations.</description>
    <dc:title>Modeling a flexible representation machinery of human concept learning</dc:title>

    <dc:creator>Toshihiko Matsuka</dc:creator>
    <dc:creator>Yasuaki Sakamoto</dc:creator>
    <dc:creator>Arieta Chouchourelou</dc:creator>
    <dc:identifier>doi:10.1016/j.neunet.2007.12.035</dc:identifier>
    <dc:source>Neural Networks, Vol. 21, No. 2-3. ( 2008), pp. 289-302.</dc:source>
    <dc:date>2008-03-15T21:58:12-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Neural Networks</prism:publicationName>
    <prism:volume>21</prism:volume>
    <prism:number>2-3</prism:number>
    <prism:startingPage>289</prism:startingPage>
    <prism:endingPage>302</prism:endingPage>
    <prism:category>machine-learning</prism:category>
    <prism:category>models</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2537897">
    <title>How language can help discrimination in the Neural Modelling Fields framework</title>
    <link>http://www.citeulike.org/user/briordan/article/2537897</link>
    <description>&lt;i&gt;Neural Networks, Vol. 21, No. 2-3. ( 2008), pp. 250-256.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;The relationship between thought and language and, in particular, the issue of whether and how language influences thought is still a matter of fierce debate. Here we consider a discrimination task scenario to study language acquisition in which an agent receives linguistic input from an external teacher, in addition to sensory stimuli from the objects that exemplify the overlapping categories that make up the environment. Sensory and linguistic input signals are fused using the Neural Modelling Fields (NMF) categorization algorithm. We find that the agent with language is capable of differentiating object features that it could not distinguish without language. In this sense, the linguistic stimuli prompt the agent to redefine and refine the discrimination capacity of its sensory channels.</description>
    <dc:title>How language can help discrimination in the Neural Modelling Fields framework</dc:title>

    <dc:creator>Jose Fontanari</dc:creator>
    <dc:creator>Leonid Perlovsky</dc:creator>
    <dc:identifier>doi:10.1016/j.neunet.2007.12.007</dc:identifier>
    <dc:source>Neural Networks, Vol. 21, No. 2-3. ( 2008), pp. 250-256.</dc:source>
    <dc:date>2008-03-15T21:53:30-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Neural Networks</prism:publicationName>
    <prism:volume>21</prism:volume>
    <prism:number>2-3</prism:number>
    <prism:startingPage>250</prism:startingPage>
    <prism:endingPage>256</prism:endingPage>
    <prism:category>linguistic-relativity</prism:category>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2537891">
    <title>On multidimensional scaling and the embedding of self-organising maps</title>
    <link>http://www.citeulike.org/user/briordan/article/2537891</link>
    <description>&lt;i&gt;Neural Networks, Vol. 21, No. 2-3. ( 2008), pp. 160-169.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;The self-organising map (SOM) and its variant, visualisation induced SOM (ViSOM), have been known to yield similar results to multidimensional scaling (MDS). However, the exact connection has not been established. In this paper, a review on the SOM and its cost function and topological measures is provided first. We then examine the exact scaling effect of the SOM and ViSOM from their objective functions. The SOM is shown to produce a qualitative, nonmetric scaling, while the local distance-preserving ViSOM produces a quantitative or metric scaling. Their relationship with the principal manifold is also discussed. The SOM-based methods not only produce topological or metric scaling but also provide a principal manifold. Furthermore a growing ViSOM is proposed to aid the adaptive embedding of highly nonlinear manifolds. Examples and comparisons with other embedding methods such as Isomap and local linear embedding are also presented.</description>
    <dc:title>On multidimensional scaling and the embedding of self-organising maps</dc:title>

    <dc:creator>Hujun Yin</dc:creator>
    <dc:identifier>doi:10.1016/j.neunet.2007.12.027</dc:identifier>
    <dc:source>Neural Networks, Vol. 21, No. 2-3. ( 2008), pp. 160-169.</dc:source>
    <dc:date>2008-03-15T21:47:29-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Neural Networks</prism:publicationName>
    <prism:volume>21</prism:volume>
    <prism:number>2-3</prism:number>
    <prism:startingPage>160</prism:startingPage>
    <prism:endingPage>169</prism:endingPage>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2462930">
    <title>Clustering of Count Data Using Generalized Dirichlet Multinomial Distributions</title>
    <link>http://www.citeulike.org/user/briordan/article/2462930</link>
    <description>&lt;i&gt;Knowledge and Data Engineering, IEEE Transactions on, Vol. 20, No. 4. (2008), pp. 462-474.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;In this paper we examine the problem of count data clustering. We analyze this problem using finite mixtures of distributions. The multinomial and the multinomial Dirichlet distributions are widely accepted to model count data. We show that these two distributions cannot be the best choice in all the applications and we propose another model called the multinomial generalized Dirichlet distribution (MGDD) that is the composition of the generalized Dirichlet distribution and the multinomial, in the same way that the multinomial Dirichlet distribution (MDD) is the composition of the Dirichlet and the multinomial. The estimation of the parameters and the determination of the number of components in our model are based on the deterministic annealing expectation-maximization (DAEM) approach and the minimum description length (MDL) criterion, respectively. We compare our method to standard approaches such as multinomial and multinomial Dirichlet mixtures to show its merits. The comparison involves different applications such as spatial color image databases indexing, handwritten digit recognition, and text documents clustering.</description>
    <dc:title>Clustering of Count Data Using Generalized Dirichlet Multinomial Distributions</dc:title>

    <dc:creator>Nizar Bouguila</dc:creator>
    <dc:identifier>doi:10.1109/TKDE.2007.190726</dc:identifier>
    <dc:source>Knowledge and Data Engineering, IEEE Transactions on, Vol. 20, No. 4. (2008), pp. 462-474.</dc:source>
    <dc:date>2008-03-04T02:56:59-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Knowledge and Data Engineering, IEEE Transactions on</prism:publicationName>
    <prism:volume>20</prism:volume>
    <prism:number>4</prism:number>
    <prism:startingPage>462</prism:startingPage>
    <prism:endingPage>474</prism:endingPage>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2462923">
    <title>A Study of the Neighborhood Counting Similarity</title>
    <link>http://www.citeulike.org/user/briordan/article/2462923</link>
    <description>&lt;i&gt;Knowledge and Data Engineering, IEEE Transactions on, Vol. 20, No. 4. (2008), pp. 449-461.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;A novel similarity, neighborhood counting measure, was recently proposed which counts the number of neighborhoods of a pair of data points. This similarity can handle numerical and categorical attributes in a conceptually uniform way, can be calculated efficiently through a simple formula, and gives good performance when tested in the framework of k-nearest neighbor classifier. In particular it consistently outperforms a combination of the classical Euclidean distance and Hamming distance. This measure was also shown to be related to a probability formalism, G probability, which is induced from a target probability function P. It was however unclear how G is related to P, especially for classification. Therefore it was not possible to explain some characteristic features of the neighborhood counting measure. In this paper we show that G is a linear function of P, and G-based Bayes classification is equivalent to P-based Bayes classification. We also show that the k-nearest neighbor classifier, when weighted by the neighborhood counting measure, is in fact an approximation of the G-based Bayes classifier, and furthermore, the P-based Bayes classifier. Additionally we show that the neighborhood counting measure remains unchanged when binary attributes are treated as categorical or numerical data. This is a feature that is not shared by other distance measures, to the best of our knowledge. This study provides a theoretical insight into the neighborhood counting measure.</description>
    <dc:title>A Study of the Neighborhood Counting Similarity</dc:title>

    <dc:creator>Hui Wang</dc:creator>
    <dc:creator>Fionn Murtagh</dc:creator>
    <dc:identifier>doi:10.1109/TKDE.2007.190721</dc:identifier>
    <dc:source>Knowledge and Data Engineering, IEEE Transactions on, Vol. 20, No. 4. (2008), pp. 449-461.</dc:source>
    <dc:date>2008-03-04T02:54:53-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Knowledge and Data Engineering, IEEE Transactions on</prism:publicationName>
    <prism:volume>20</prism:volume>
    <prism:number>4</prism:number>
    <prism:startingPage>449</prism:startingPage>
    <prism:endingPage>461</prism:endingPage>
    <prism:category>distributional-similarity</prism:category>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2362997">
    <title>Connectionism, controllers and a brain theory</title>
    <link>http://www.citeulike.org/user/briordan/article/2362997</link>
    <description>&lt;i&gt;IEEE Transactions on Systems, Man and Cybernetics, Part A (to appear)&lt;/i&gt;</description>
    <dc:title>Connectionism, controllers and a brain theory</dc:title>

    <dc:creator>Roy Asim</dc:creator>
    <dc:source>IEEE Transactions on Systems, Man and Cybernetics, Part A (to appear)</dc:source>
    <dc:date>2008-02-11T14:12:25-00:00</dc:date>
    <prism:publicationName>IEEE Transactions on Systems, Man and Cybernetics, Part A</prism:publicationName>
    <prism:category>general-psycholinguistics</prism:category>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2355325">
    <title>Response to Comment on &#34;Clustering by Passing Messages Between Data Points&#34;</title>
    <link>http://www.citeulike.org/user/briordan/article/2355325</link>
    <description>&lt;i&gt;Science, Vol. 319, No. 5864. (8 February 2008), 726d.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Affinity propagation (AP) can be viewed as a generalization of the vertex substitution heuristic (VSH), whereby probabilistic exemplar substitutions are performed concurrently. Although results on small data sets ([&#8804;]900 points) demonstrate that VSH is competitive with AP, we found VSH to be prohibitively slow for moderate-to-large problems, whereas AP was much faster and could achieve lower error. 10.1126/science.1151268</description>
    <dc:title>Response to Comment on &#34;Clustering by Passing Messages Between Data Points&#34;</dc:title>

    <dc:creator>Brendan Frey</dc:creator>
    <dc:creator>Delbert Dueck</dc:creator>
    <dc:identifier>doi:10.1126/science.1151268</dc:identifier>
    <dc:source>Science, Vol. 319, No. 5864. (8 February 2008), 726d.</dc:source>
    <dc:date>2008-02-09T01:30:51-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Science</prism:publicationName>
    <prism:volume>319</prism:volume>
    <prism:number>5864</prism:number>
    <prism:startingPage>726d</prism:startingPage>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2321812">
    <title>Machine learning: a review of classification and combining techniques</title>
    <link>http://www.citeulike.org/user/briordan/article/2321812</link>
    <description>&lt;i&gt;Artificial Intelligence Review, Vol. 26, No. 3. (November 2006), pp. 159-190.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Abstract&#160;&#160;Supervised classification is one of the tasks most frequently carried out by so-called Intelligent Systems. Thus, a large number of techniques have been developed based on Artificial Intelligence (Logic-based techniques, Perceptron-based techniques) and Statistics (Bayesian Networks, Instance-based techniques). The goal of supervised learning is to build a concise model of the distribution of class labels in terms of predictor features. The resulting classifier is then used to assign class labels to the testing instances where the values of the predictor features are known, but the value of the class label is unknown. This paper describes various classification algorithms and the recent attempt for improving classification accuracy—ensembles of classifiers.</description>
    <dc:title>Machine learning: a review of classification and combining techniques</dc:title>

    <dc:creator>S Kotsiantis</dc:creator>
    <dc:creator>I Zaharakis</dc:creator>
    <dc:creator>P Pintelas</dc:creator>
    <dc:identifier>doi:10.1007/s10462-007-9052-3</dc:identifier>
    <dc:source>Artificial Intelligence Review, Vol. 26, No. 3. (November 2006), pp. 159-190.</dc:source>
    <dc:date>2008-02-02T01:48:23-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Artificial Intelligence Review</prism:publicationName>
    <prism:volume>26</prism:volume>
    <prism:number>3</prism:number>
    <prism:startingPage>159</prism:startingPage>
    <prism:endingPage>190</prism:endingPage>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/312476">
    <title>Unsupervised learning of natural languages.</title>
    <link>http://www.citeulike.org/user/briordan/article/312476</link>
    <description>&lt;i&gt;Proc Natl Acad Sci U S A, Vol. 102, No. 33. (16 August 2005), pp. 11629-11634.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We address the problem, fundamental to linguistics, bioinformatics, and certain other disciplines, of using corpora of raw symbolic sequential data to infer underlying rules that govern their production. Given a corpus of strings (such as text, transcribed speech, chromosome or protein sequence data, sheet music, etc.), our unsupervised algorithm recursively distills from it hierarchically structured patterns. The adios (automatic distillation of structure) algorithm relies on a statistical method for pattern extraction and on structured generalization, two processes that have been implicated in language acquisition. It has been evaluated on artificial context-free grammars with thousands of rules, on natural languages as diverse as English and Chinese, and on protein data correlating sequence with function. This unsupervised algorithm is capable of learning complex syntax, generating grammatical novel sentences, and proving useful in other fields that call for structure discovery from raw data, such as bioinformatics.</description>
    <dc:title>Unsupervised learning of natural languages.</dc:title>

    <dc:creator>Z Solan</dc:creator>
    <dc:creator>D Horn</dc:creator>
    <dc:creator>E Ruppin</dc:creator>
    <dc:creator>S Edelman</dc:creator>
    <dc:identifier>doi:10.1073/pnas.0409746102</dc:identifier>
    <dc:source>Proc Natl Acad Sci U S A, Vol. 102, No. 33. (16 August 2005), pp. 11629-11634.</dc:source>
    <dc:date>2005-09-07T07:16:40-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Proc Natl Acad Sci U S A</prism:publicationName>
    <prism:issn>0027-8424</prism:issn>
    <prism:volume>102</prism:volume>
    <prism:number>33</prism:number>
    <prism:startingPage>11629</prism:startingPage>
    <prism:endingPage>11634</prism:endingPage>
    <prism:category>computational-linguistics</prism:category>
    <prism:category>machine-learning</prism:category>
    <prism:category>models</prism:category>
    <prism:category>syntactic-acquisition</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2198867">
    <title>Statistical Computing with R</title>
    <link>http://www.citeulike.org/user/briordan/article/2198867</link>
    <description>&lt;i&gt;(2007)&lt;/i&gt;</description>
    <dc:title>Statistical Computing with R</dc:title>

    <dc:creator>Maria Rizzo</dc:creator>
    <dc:source>(2007)</dc:source>
    <dc:date>2008-01-06T01:46:17-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:publisher>Chapman &#38; Hall/CRC</prism:publisher>
    <prism:category>handbook</prism:category>
    <prism:category>machine-learning</prism:category>
    <prism:category>textbook</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2192875">
    <title>Using two-stage conditional word frequency models to model word burstiness and motivating TF-IDF</title>
    <link>http://www.citeulike.org/user/briordan/article/2192875</link>
    <description>&lt;i&gt;(2007)&lt;/i&gt;</description>
    <dc:title>Using two-stage conditional word frequency models to model word burstiness and motivating TF-IDF</dc:title>

    <dc:creator>Peter Sunehag</dc:creator>
    <dc:source>(2007)</dc:source>
    <dc:date>2008-01-04T01:56:40-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:category>computational-lexical-semantics</prism:category>
    <prism:category>distributional-similarity</prism:category>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2192865">
    <title>A latent space approach to dynamic embedding of co-occurrence data</title>
    <link>http://www.citeulike.org/user/briordan/article/2192865</link>
    <description>&lt;i&gt;(2007)&lt;/i&gt;</description>
    <dc:title>A latent space approach to dynamic embedding of co-occurrence data</dc:title>

    <dc:creator>Purnamrita Sarkar</dc:creator>
    <dc:creator>Sajid Siddiqi</dc:creator>
    <dc:creator>Geoffrey Gordon</dc:creator>
    <dc:source>(2007)</dc:source>
    <dc:date>2008-01-04T01:51:27-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:category>distributional-similarity</prism:category>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2186656">
    <title>Incorporating prior knowledge on features into learning</title>
    <link>http://www.citeulike.org/user/briordan/article/2186656</link>
    <description>&lt;i&gt;(2007)&lt;/i&gt;</description>
    <dc:title>Incorporating prior knowledge on features into learning</dc:title>

    <dc:creator>Eyal Krupka</dc:creator>
    <dc:creator>Naftali Tishby</dc:creator>
    <dc:source>(2007)</dc:source>
    <dc:date>2008-01-02T01:44:40-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2186649">
    <title>Hidden topic Markov models</title>
    <link>http://www.citeulike.org/user/briordan/article/2186649</link>
    <description>&lt;i&gt;(2007)&lt;/i&gt;</description>
    <dc:title>Hidden topic Markov models</dc:title>

    <dc:creator>Amit Gruber</dc:creator>
    <dc:creator>Michal Rosen-Zvi</dc:creator>
    <dc:creator>Yair Weiss</dc:creator>
    <dc:source>(2007)</dc:source>
    <dc:date>2008-01-02T01:39:25-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:category>distributional-similarity</prism:category>
    <prism:category>machine-learning</prism:category>
    <prism:category>models</prism:category>
    <prism:category>topics-model</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2186645">
    <title>Fast search for Dirichlet process mixture models</title>
    <link>http://www.citeulike.org/user/briordan/article/2186645</link>
    <description>&lt;i&gt;(2007)&lt;/i&gt;</description>
    <dc:title>Fast search for Dirichlet process mixture models</dc:title>

    <dc:creator>Hal Daume</dc:creator>
    <dc:source>(2007)</dc:source>
    <dc:date>2008-01-02T01:34:52-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2186641">
    <title>Visualizing similarity data with a mixture of maps</title>
    <link>http://www.citeulike.org/user/briordan/article/2186641</link>
    <description>&lt;i&gt;(2007)&lt;/i&gt;</description>
    <dc:title>Visualizing similarity data with a mixture of maps</dc:title>

    <dc:creator>James Cook</dc:creator>
    <dc:creator>Ilya Sutskever</dc:creator>
    <dc:creator>Andriy Mnih</dc:creator>
    <dc:creator>Geoffrey Hinton</dc:creator>
    <dc:source>(2007)</dc:source>
    <dc:date>2008-01-02T01:30:24-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:category>machine-learning</prism:category>
    <prism:category>word-association</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2186636">
    <title>The Laplacian eigenmaps latent variable model</title>
    <link>http://www.citeulike.org/user/briordan/article/2186636</link>
    <description>&lt;i&gt;(2007)&lt;/i&gt;</description>
    <dc:title>The Laplacian eigenmaps latent variable model</dc:title>

    <dc:creator>Miguel Careirra-Perpinan</dc:creator>
    <dc:creator>Zhengdong Lu</dc:creator>
    <dc:source>(2007)</dc:source>
    <dc:date>2008-01-02T01:24:50-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2178376">
    <title>Identifying semantic equivalence for multi-document summarisation</title>
    <link>http://www.citeulike.org/user/briordan/article/2178376</link>
    <description>&lt;i&gt;Artificial Intelligence Review, Vol. 25, No. 1. (April 2006), pp. 55-65.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Abstract&#160;&#160;We describe Semantic Equivalence and Textual Entailment Recognition, and outline a system which uses a number of lexical, syntactic and semantic features to classify pairs of sentences as “semantically equivalent”. We describe an experiment to show how syntactic and semantic features improve the performance of an earlier system, which used only lexical features. We also outline some areas for future work.</description>
    <dc:title>Identifying semantic equivalence for multi-document summarisation</dc:title>

    <dc:creator>Eamonn Newman</dc:creator>
    <dc:creator>Joe Carthy</dc:creator>
    <dc:creator>John Dunnion</dc:creator>
    <dc:creator>Nicola Stokes</dc:creator>
    <dc:identifier>doi:10.1007/s10462-007-9018-5</dc:identifier>
    <dc:source>Artificial Intelligence Review, Vol. 25, No. 1. (April 2006), pp. 55-65.</dc:source>
    <dc:date>2007-12-29T01:46:54-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Artificial Intelligence Review</prism:publicationName>
    <prism:volume>25</prism:volume>
    <prism:number>1</prism:number>
    <prism:startingPage>55</prism:startingPage>
    <prism:endingPage>65</prism:endingPage>
    <prism:category>computational-linguistics</prism:category>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2069894">
    <title>Randomized algorithms for the low-rank approximation of matrices</title>
    <link>http://www.citeulike.org/user/briordan/article/2069894</link>
    <description>&lt;i&gt;Proceedings of the National Academy of Sciences (5 December 2007), 0709640104.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We describe two recently proposed randomized algorithms for the construction of low-rank approximations to matrices, and demonstrate their application (inter alia) to the evaluation of the singular value decompositions of numerically low-rank matrices. Being probabilistic, the schemes described here have a finite probability of failure; in most cases, this probability is rather negligible (1017 is a typical value). In many situations, the new procedures are considerably more efficient and reliable than the classical (deterministic) ones; they also parallelize naturally. We present several numerical examples to illustrate the performance of the schemes. 10.1073/pnas.0709640104</description>
    <dc:title>Randomized algorithms for the low-rank approximation of matrices</dc:title>

    <dc:creator>Edo Liberty</dc:creator>
    <dc:creator>Franco Woolfe</dc:creator>
    <dc:creator>Per-Gunnar Martinsson</dc:creator>
    <dc:creator>Vladimir Rokhlin</dc:creator>
    <dc:creator>Mark Tygert</dc:creator>
    <dc:identifier>doi:10.1073/pnas.0709640104</dc:identifier>
    <dc:source>Proceedings of the National Academy of Sciences (5 December 2007), 0709640104.</dc:source>
    <dc:date>2007-12-06T23:55:18-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:publicationName>Proceedings of the National Academy of Sciences</prism:publicationName>
    <prism:startingPage>0709640104</prism:startingPage>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2134463">
    <title>Seeking The Truly Correlated Topic Posterior: on tight approximate inference of logistic-normal admixture model</title>
    <link>http://www.citeulike.org/user/briordan/article/2134463</link>
    <description>&lt;i&gt;(2007)&lt;/i&gt;</description>
    <dc:title>Seeking The Truly Correlated Topic Posterior: on tight approximate inference of logistic-normal admixture model</dc:title>

    <dc:creator>Amr Ahmed</dc:creator>
    <dc:creator>Eric Xing</dc:creator>
    <dc:source>(2007)</dc:source>
    <dc:date>2007-12-17T02:03:17-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:category>distributional-similarity</prism:category>
    <prism:category>machine-learning</prism:category>
    <prism:category>topics-model</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/1940101">
    <title>A Metropolis-Hastings algorithm for dynamic causal models</title>
    <link>http://www.citeulike.org/user/briordan/article/1940101</link>
    <description>&lt;i&gt;NeuroImage, Vol. 38, No. 3. (15 November 2007), pp. 478-487.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Dynamic causal modelling (DCM) is a modelling framework used to describe causal interactions in dynamical systems. It was developed to infer the causal architecture of networks of neuronal populations in the brain [Friston, K.J., Harrison, L, Penny, W., 2003. Dynamic causal modelling. NeuroImage. Aug; 19 (4): 1273-302]. In current formulations of DCM, the mean structure of the likelihood is a nonlinear and numerical function of the parameters, which precludes exact or analytic Bayesian inversion. To date, approximations to the posterior depend on the assumption of normality (i.e., the Laplace assumption). In particular, two arguments have been used to motivate normality of the prior and posterior distributions. First, Gaussian priors on the parameters are specified carefully to ensure that activity in the dynamic system of neuronal populations converges to a steady state (i.e., the dynamic system is dissipative). Secondly, normality of the posterior is an approximation based on general asymptotic results, regarding the form of the posterior under infinite data [Friston, K.J., Harrison, L, Penny, W., 2003. Dynamic causal modelling. NeuroImage. Aug; 19 (4): 1273-302]. Here, we provide a critique of these assumptions and evaluate them numerically. We use a Bayesian inversion scheme (the Metropolis-Hastings algorithm) that eschews both assumptions. This affords an independent route to the posterior and an external means to assess the performance of conventional schemes for DCM. It also allows us to assess the sensitivity of the posterior to different priors. First, we retain the conventional priors and compare the ensuing approximate posterior (Laplace) to the exact posterior (MCMC). Our analyses show that the Laplace approximation is appropriate for practical purposes. In a second, independent set of analyses, we compare the exact posterior under conventional priors with an exact posterior under newly defined uninformative priors. Reassuringly, we observe that the posterior is, for all practical purposes, insensitive of the choice of prior.</description>
    <dc:title>A Metropolis-Hastings algorithm for dynamic causal models</dc:title>

    <dc:creator>Justin Chumbley</dc:creator>
    <dc:creator>Karl Friston</dc:creator>
    <dc:creator>Tom Fearn</dc:creator>
    <dc:creator>Stefan Kiebel</dc:creator>
    <dc:identifier>doi:10.1016/j.neuroimage.2007.07.028</dc:identifier>
    <dc:source>NeuroImage, Vol. 38, No. 3. (15 November 2007), pp. 478-487.</dc:source>
    <dc:date>2007-11-19T22:34:31-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:publicationName>NeuroImage</prism:publicationName>
    <prism:volume>38</prism:volume>
    <prism:number>3</prism:number>
    <prism:startingPage>478</prism:startingPage>
    <prism:endingPage>487</prism:endingPage>
    <prism:category>bayesian</prism:category>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2126067">
    <title>Query expansion and dimensionality reduction: Notions of optimality in Rocchio relevance feedback and latent semantic indexing</title>
    <link>http://www.citeulike.org/user/briordan/article/2126067</link>
    <description>&lt;i&gt;Information Processing &#38; Management, Vol. 44, No. 1. (January 2008), pp. 163-180.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Rocchio relevance feedback and latent semantic indexing (LSI) are well-known extensions of the vector space model for information retrieval (IR). This paper analyzes the statistical relationship between these extensions. The analysis focuses on each method's basis in least-squares optimization. Noting that LSI and Rocchio relevance feedback both alter the vector space model in a way that is in some sense least-squares optimal, we ask: what is the relationship between LSI's and Rocchio's notions of optimality? What does this relationship imply for IR? Using an analytical approach, we argue that Rocchio relevance feedback is optimal if we understand retrieval as a simplified classification problem. On the other hand, LSI's motivation comes to the fore if we understand it as a biased regression technique, where projection onto a low-dimensional orthogonal subspace of the documents reduces model variance.</description>
    <dc:title>Query expansion and dimensionality reduction: Notions of optimality in Rocchio relevance feedback and latent semantic indexing</dc:title>

    <dc:creator>Miles Efron</dc:creator>
    <dc:identifier>doi:10.1016/j.ipm.2006.12.008</dc:identifier>
    <dc:source>Information Processing &#38; Management, Vol. 44, No. 1. (January 2008), pp. 163-180.</dc:source>
    <dc:date>2007-12-16T02:06:05-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Information Processing &#38; Management</prism:publicationName>
    <prism:volume>44</prism:volume>
    <prism:number>1</prism:number>
    <prism:startingPage>163</prism:startingPage>
    <prism:endingPage>180</prism:endingPage>
    <prism:category>computational-linguistics</prism:category>
    <prism:category>distributional-similarity</prism:category>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2113835">
    <title>Creating hierarchical categories using cell assemblies</title>
    <link>http://www.citeulike.org/user/briordan/article/2113835</link>
    <description>&lt;i&gt;pp. 1-24.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Highly recurrent neural networks can learn reverberating circuits called Cell Assemblies (CAs). These networks can be used to categorize input, and this paper explores the ability of CAs to learn hierarchical categories. A simulator, based on spiking fatiguing leaky integrators, is presented with instances of base categories. Learning is done using a compensatory Hebbian learning rule. The model takes advantage of overlapping CAs where neurons may participate in more than one CA. Using the unsupervised compensatory learning rule, the networks learn a hierarchy of categories that correctly categorize 97% of the basic level presentations of the input in our test. It categorizes 100% of the super-categories correctly. A larger hierarchy is learned that correctly categorizes 100% of base categories, and 89% of super-categories. It is also shown how novel subcategories gain default information from their super-category. These simulations show that networks containing CAs can be used to learn hierarchical categories. The network then can successfully categorize novel inputs.</description>
    <dc:title>Creating hierarchical categories using cell assemblies</dc:title>

    <dc:creator>Christian Huyck</dc:creator>
    <dc:source>pp. 1-24.</dc:source>
    <dc:date>2007-12-14T14:12:06-00:00</dc:date>
    <prism:startingPage>1</prism:startingPage>
    <prism:endingPage>24</prism:endingPage>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2113349">
    <title>Clustering of Count Data Using Generalized Dirichlet Multinomial Distributions</title>
    <link>http://www.citeulike.org/user/briordan/article/2113349</link>
    <description>&lt;i&gt;IEEE Transactions on Knowledge and Data Engineering (16 November 2007)&lt;/i&gt;</description>
    <dc:title>Clustering of Count Data Using Generalized Dirichlet Multinomial Distributions</dc:title>

    <dc:creator>Nizar Bouguila</dc:creator>
    <dc:source>IEEE Transactions on Knowledge and Data Engineering (16 November 2007)</dc:source>
    <dc:date>2007-12-14T12:18:10-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:publicationName>IEEE Transactions on Knowledge and Data Engineering</prism:publicationName>
    <prism:publisher>IEEE Computer Society Digital Library</prism:publisher>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2113337">
    <title>Explaining Classifications For Individual Instances</title>
    <link>http://www.citeulike.org/user/briordan/article/2113337</link>
    <description>&lt;i&gt;IEEE Transactions on Knowledge and Data Engineering (7 December 2007)&lt;/i&gt;</description>
    <dc:title>Explaining Classifications For Individual Instances</dc:title>

    <dc:creator>Marko Robnik-Sikon</dc:creator>
    <dc:creator>Igor Kononenko</dc:creator>
    <dc:source>IEEE Transactions on Knowledge and Data Engineering (7 December 2007)</dc:source>
    <dc:date>2007-12-14T12:13:22-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:publicationName>IEEE Transactions on Knowledge and Data Engineering</prism:publicationName>
    <prism:publisher>IEEE Computer Society Digital Library</prism:publisher>
    <prism:category>machine-learning</prism:category>
    <prism:category>methods</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/2101496">
    <title>An enhanced self-organizing incremental neural network for online unsupervised learning</title>
    <link>http://www.citeulike.org/user/briordan/article/2101496</link>
    <description>&lt;i&gt;Neural Networks, Vol. 20, No. 8. (October 2007), pp. 893-903.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;An enhanced self-organizing incremental neural network (ESOINN) is proposed to accomplish online unsupervised learning tasks. It improves the self-organizing incremental neural network (SOINN) [Shen, F., Hasegawa, O. (2006a). An incremental network for on-line unsupervised classification and topology learning. Neural Networks, 19, 90-106] in the following respects: (1) it adopts a single-layer network to take the place of the two-layer network structure of SOINN; (2) it separates clusters with high-density overlap; (3) it uses fewer parameters than SOINN; and (4) it is more stable than SOINN. The experiments for both the artificial dataset and the real-world dataset also show that ESOINN works better than SOINN.</description>
    <dc:title>An enhanced self-organizing incremental neural network for online unsupervised learning</dc:title>

    <dc:creator>Shen Furao</dc:creator>
    <dc:creator>Tomotaka Ogura</dc:creator>
    <dc:creator>Osamu Hasegawa</dc:creator>
    <dc:identifier>doi:10.1016/j.neunet.2007.07.008</dc:identifier>
    <dc:source>Neural Networks, Vol. 20, No. 8. (October 2007), pp. 893-903.</dc:source>
    <dc:date>2007-12-13T01:41:43-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:publicationName>Neural Networks</prism:publicationName>
    <prism:volume>20</prism:volume>
    <prism:number>8</prism:number>
    <prism:startingPage>893</prism:startingPage>
    <prism:endingPage>903</prism:endingPage>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/1770144">
    <title>Extending boosting for large scale spoken language understanding</title>
    <link>http://www.citeulike.org/user/briordan/article/1770144</link>
    <description>&lt;i&gt;Machine Learning, Vol. 69, No. 1. (4 October 2007), pp. 55-74.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Abstract&#160;&#160; We propose three methods for extending the Boosting family of classifiers motivated by the real-life problems we have encountered. First, we propose a semisupervised learning method for exploiting the unlabeled data in Boosting. We then present a novel classification model adaptation method. The goal of adaptation is optimizing an existing model for a new target application, which is similar to the previous one but may have different classes or class distributions. Finally, we present an efficient and effective cost-sensitive classification method that extends Boosting to allow for weighted classes. We evaluated these methods for call classification in the AT&#38;T VoiceTone� spoken language understanding system. Our results indicate that it is possible to obtain the same classification performance by using 30% less labeled data when the unlabeled data is utilized through semisupervised learning. Using model adaptation we can achieve the same classification accuracy using less than half of the labeled data from the new application. Finally, we present significant improvements in the “important” (i.e., higher weighted) classes without a significant loss in overall performance using the proposed cost-sensitive classification method.</description>
    <dc:title>Extending boosting for large scale spoken language understanding</dc:title>

    <dc:creator>Gokhan Tur</dc:creator>
    <dc:identifier>doi:10.1007/s10994-007-5023-9</dc:identifier>
    <dc:source>Machine Learning, Vol. 69, No. 1. (4 October 2007), pp. 55-74.</dc:source>
    <dc:date>2007-10-15T12:59:00-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:publicationName>Machine Learning</prism:publicationName>
    <prism:volume>69</prism:volume>
    <prism:number>1</prism:number>
    <prism:startingPage>55</prism:startingPage>
    <prism:endingPage>74</prism:endingPage>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/briordan/article/1711091">
    <title>Large-Scale Kernel Machines</title>
    <link>http://www.citeulike.org/user/briordan/article/1711091</link>
    <description>&lt;i&gt;(2007)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Pervasive and networked computers have dramatically reduced the cost of collecting and distributing large datasets. In this context, machine learning algorithms that scale poorly could simply become irrelevant. We need learning algorithms that scale linearly with the volume of the data while maintaining enough statistical efficiency to outperform algorithms that simply process a random subset of the data. This volume offers researchers and engineers practical solutions for training kernel machines from large scale datasets, with detailed descriptions of algorithms and experiments carried out on realistically large datasets. After a detailed description of state-of-the-art kernel machine technology, an introduction of the essential concepts discussed in the volume, and a comparison of primal and dual optimization techniques, the book progresses from well-understood techniques to more novel and controversial approaches. Many contributors have made their code and data available online for further experimentation. Topics covered include fast implementations of known algorithms, approximations that are amenable to theoretical guarantees, and algorithms that perform well in practice but are difficult to analyze theoretically.</description>
    <dc:title>Large-Scale Kernel Machines</dc:title>

    <dc:source>(2007)</dc:source>
    <dc:date>2007-09-30T11:42:22-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:publisher>MIT Press</prism:publisher>
    <prism:category>machine-learning</prism:category>
</item>



</rdf:RDF>

