<?xml version="1.0" encoding="UTF-8"?>

<rdf:RDF
   xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
   xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#"
   xmlns="http://purl.org/rss/1.0/"
   xmlns:dc="http://purl.org/dc/elements/1.1/"
   xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/"
   xmlns:dcterms="http://purl.org/dc/terms/"

>
<channel rdf:about="http://www.citeulike.org/about">
<pubDate>Sun, 27 Jul 2008 08:22:49 BST</pubDate>


	<title>CiteULike: markusd's library [226 articles]</title>
	<description>CiteULike: markusd's library [226 articles]</description>


	<link>http://www.citeulike.org/user/markusd</link>
	<dc:publisher>CiteULike.org</dc:publisher>
	<dc:language>en-gb</dc:language>
	<dc:rights>Copyright &#169; 2004-2008 citeulike.org</dc:rights>
	<items>
    <rdf:Seq>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/965794"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2905903"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2919014"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2923062"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2925635"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2931375"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/3003125"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/3006057"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/3006699"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2904428"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2911929"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/3010801"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/1466789"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/3001638"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/3015179"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/1321312"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2879987"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2877651"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2865762"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/404842"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2853679"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2649887"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2853609"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/438894"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2837648"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/1816299"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2098449"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2795079"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2795073"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2795060"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2416370"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2416377"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/474507"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2157295"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2296567"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2131744"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2731299"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2767135"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2393065"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2416208"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2347455"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/415566"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/105906"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/828999"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2766880"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/1454024"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/148945"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/2011105"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/110110"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/markusd/article/873540"/>

	</rdf:Seq>
	</items>
	</channel>


<item rdf:about="http://www.citeulike.org/user/markusd/article/965794">
    <title>Hierarchical Dirichlet Processes</title>
    <link>http://www.citeulike.org/user/markusd/article/965794</link>
    <description>&lt;i&gt;Journal of the American Statistical Association, Vol. 101, No. 476. (December 2006), pp. 1566-1581.&lt;/i&gt;</description>
    <dc:title>Hierarchical Dirichlet Processes</dc:title>

    <dc:creator>Teh</dc:creator>
    <dc:creator>Yee Whye</dc:creator>
    <dc:creator>Jordan</dc:creator>
    <dc:creator>I Michael</dc:creator>
    <dc:creator>Beal</dc:creator>
    <dc:creator>J Matthew</dc:creator>
    <dc:creator>Blei</dc:creator>
    <dc:creator>M David</dc:creator>
    <dc:identifier>doi:10.1198/016214506000000302</dc:identifier>
    <dc:source>Journal of the American Statistical Association, Vol. 101, No. 476. (December 2006), pp. 1566-1581.</dc:source>
    <dc:date>2006-11-29T01:37:01-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Journal of the American Statistical Association</prism:publicationName>
    <prism:issn>0162-1459</prism:issn>
    <prism:volume>101</prism:volume>
    <prism:number>476</prism:number>
    <prism:startingPage>1566</prism:startingPage>
    <prism:endingPage>1581</prism:endingPage>
    <prism:publisher>American Statistical Association</prism:publisher>
    <prism:category>dirichlet</prism:category>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2905903">
    <title>Design of the Moses Decoder for Statistical Machine Translation</title>
    <link>http://www.citeulike.org/user/markusd/article/2905903</link>
    <description>&lt;i&gt;(June 2008), pp. 58-65.&lt;/i&gt;</description>
    <dc:title>Design of the Moses Decoder for Statistical Machine Translation</dc:title>

    <dc:creator>Hieu Hoang</dc:creator>
    <dc:creator>Philipp Koehn</dc:creator>
    <dc:source>(June 2008), pp. 58-65.</dc:source>
    <dc:date>2008-06-18T17:53:32-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:startingPage>58</prism:startingPage>
    <prism:endingPage>65</prism:endingPage>
    <prism:publisher>Association for Computational Linguistics</prism:publisher>
    <prism:category>smt</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2919014">
    <title>Fully Distributed EM for Very Large Datasets</title>
    <link>http://www.citeulike.org/user/markusd/article/2919014</link>
    <description>&lt;i&gt;(2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;In EM and related algorithms, E-step compu- tations distribute easily, because data items are independent given parameters. For very large data sets, however, even storing all of the parameters in a single node for the M- step can be impractical. We present a frame- work that fully distributes the entire EM pro- cedure. Each node interacts only with pa- rameters relevant to its data, sending mes- sages to other nodes along a junction-tree topology. We demonstrate improvements over a MapReduce topology, on two tasks: word alignment and topic modeling.</description>
    <dc:title>Fully Distributed EM for Very Large Datasets</dc:title>

    <dc:creator>Jason Wolfe</dc:creator>
    <dc:creator>Aria Haghighi</dc:creator>
    <dc:creator>Dan Klein</dc:creator>
    <dc:source>(2008)</dc:source>
    <dc:date>2008-06-23T14:31:04-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:category>em</prism:category>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2923062">
    <title>Syntactic Reordering Integrated with Phrase-Based SMT</title>
    <link>http://www.citeulike.org/user/markusd/article/2923062</link>
    <description>&lt;i&gt;(2008), pp. 46-54.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We present a novel approach to word re- ordering which successfully integrates syn- tactic structural knowledge with phrase-based SMT. This is done by constructing a lattice of alternatives based on automatically learned probabilistic syntactic rules. In decoding, the alternatives are scored based on the output word order, not the order of the input. Un- like previous approaches, this makes it possi- ble to successfully integrate syntactic reorder- ing with phrase-based SMT. On an English- Danish task, we achieve an absolute improve- ment in translation quality of 1.1 % BLEU. Manual evaluation supports the claim that the present approach is signiﬁcantly superior to previous approaches.</description>
    <dc:title>Syntactic Reordering Integrated with Phrase-Based SMT</dc:title>

    <dc:creator>Jakob Elming</dc:creator>
    <dc:source>(2008), pp. 46-54.</dc:source>
    <dc:date>2008-06-24T10:25:47-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:startingPage>46</prism:startingPage>
    <prism:endingPage>54</prism:endingPage>
    <prism:publisher>Association for Computational Linguistics</prism:publisher>
    <prism:category>reodering</prism:category>
    <prism:category>smt</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2925635">
    <title>Multiple Reorderings in Phrase-Based Machine Translation</title>
    <link>http://www.citeulike.org/user/markusd/article/2925635</link>
    <description>&lt;i&gt;(June 2008), pp. 61-68.&lt;/i&gt;</description>
    <dc:title>Multiple Reorderings in Phrase-Based Machine Translation</dc:title>

    <dc:creator>Niyu Ge</dc:creator>
    <dc:creator>Abe Ittycheriah</dc:creator>
    <dc:creator>Kishore Papineni</dc:creator>
    <dc:source>(June 2008), pp. 61-68.</dc:source>
    <dc:date>2008-06-25T10:29:26-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:startingPage>61</prism:startingPage>
    <prism:endingPage>68</prism:endingPage>
    <prism:publisher>Association for Computational Linguistics</prism:publisher>
    <prism:category>reordering</prism:category>
    <prism:category>smt</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2931375">
    <title>A New String-to-Dependency Machine Translation Algorithm with a Target Dependency Language Model</title>
    <link>http://www.citeulike.org/user/markusd/article/2931375</link>
    <description>&lt;i&gt;(June 2008), pp. 577-585.&lt;/i&gt;</description>
    <dc:title>A New String-to-Dependency Machine Translation Algorithm with a Target Dependency Language Model</dc:title>

    <dc:creator>Libin Shen</dc:creator>
    <dc:creator>Jinxi Xu</dc:creator>
    <dc:creator>Ralph Weischedel</dc:creator>
    <dc:source>(June 2008), pp. 577-585.</dc:source>
    <dc:date>2008-06-26T15:57:47-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:startingPage>577</prism:startingPage>
    <prism:endingPage>585</prism:endingPage>
    <prism:publisher>Association for Computational Linguistics</prism:publisher>
    <prism:category>lm</prism:category>
    <prism:category>smt</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/3003125">
    <title>Modeling Online Reviews with Multi-Grain Topic Models</title>
    <link>http://www.citeulike.org/user/markusd/article/3003125</link>
    <description>&lt;i&gt;(2008)&lt;/i&gt;</description>
    <dc:title>Modeling Online Reviews with Multi-Grain Topic Models</dc:title>

    <dc:creator>Ivan Titov</dc:creator>
    <dc:creator>Ryan Mcdonald</dc:creator>
    <dc:source>(2008)</dc:source>
    <dc:date>2008-07-15T12:32:33-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:category>machine-learning</prism:category>
    <prism:category>topic-model</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/3006057">
    <title>Name Translation in Statistical Machine Translation - Learning When to Transliterate</title>
    <link>http://www.citeulike.org/user/markusd/article/3006057</link>
    <description>&lt;i&gt;(June 2008), pp. 389-397.&lt;/i&gt;</description>
    <dc:title>Name Translation in Statistical Machine Translation - Learning When to Transliterate</dc:title>

    <dc:creator>Ulf Hermjakob</dc:creator>
    <dc:creator>Kevin Knight</dc:creator>
    <dc:creator>Hal Iii</dc:creator>
    <dc:source>(June 2008), pp. 389-397.</dc:source>
    <dc:date>2008-07-15T15:24:10-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:startingPage>389</prism:startingPage>
    <prism:endingPage>397</prism:endingPage>
    <prism:publisher>Association for Computational Linguistics</prism:publisher>
    <prism:category>morphology-project</prism:category>
    <prism:category>name-transliteration</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/3006699">
    <title>Measuring Word Alignment Quality for Statistical Machine Translation.</title>
    <link>http://www.citeulike.org/user/markusd/article/3006699</link>
    <description>&lt;i&gt;Computational Linguistics, Vol. 33, No. 3. (2007), pp. 293-303.&lt;/i&gt;</description>
    <dc:title>Measuring Word Alignment Quality for Statistical Machine Translation.</dc:title>

    <dc:creator>Alex Fraser</dc:creator>
    <dc:creator>Daniel Marcu</dc:creator>
    <dc:source>Computational Linguistics, Vol. 33, No. 3. (2007), pp. 293-303.</dc:source>
    <dc:date>2008-07-15T18:25:08-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:publicationName>Computational Linguistics</prism:publicationName>
    <prism:volume>33</prism:volume>
    <prism:number>3</prism:number>
    <prism:startingPage>293</prism:startingPage>
    <prism:endingPage>303</prism:endingPage>
    <prism:category>smt</prism:category>
    <prism:category>word-alignment</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2904428">
    <title>Accurate Max-margin Training for Structured Output Spaces.</title>
    <link>http://www.citeulike.org/user/markusd/article/2904428</link>
    <description>&lt;i&gt;(2008)&lt;/i&gt;</description>
    <dc:title>Accurate Max-margin Training for Structured Output Spaces.</dc:title>

    <dc:creator>Sunita Sarawagi</dc:creator>
    <dc:creator>Rahul Gupta</dc:creator>
    <dc:source>(2008)</dc:source>
    <dc:date>2008-06-18T07:55:10-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2911929">
    <title>Bayesian Probabilistic Matrix Factorization using Markov Chain Monte Carlo.</title>
    <link>http://www.citeulike.org/user/markusd/article/2911929</link>
    <description>&lt;i&gt;(2008)&lt;/i&gt;</description>
    <dc:title>Bayesian Probabilistic Matrix Factorization using Markov Chain Monte Carlo.</dc:title>

    <dc:creator>Salakhyuditnov</dc:creator>
    <dc:creator>Mnih</dc:creator>
    <dc:source>(2008)</dc:source>
    <dc:date>2008-06-21T04:03:24-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:category>bayes</prism:category>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/3010801">
    <title>Learning Classifiers from Only Positive and Unlabeled Data</title>
    <link>http://www.citeulike.org/user/markusd/article/3010801</link>
    <description>&lt;i&gt;(2008)&lt;/i&gt;</description>
    <dc:title>Learning Classifiers from Only Positive and Unlabeled Data</dc:title>

    <dc:creator>Charles Elkan</dc:creator>
    <dc:creator>Keith Noto</dc:creator>
    <dc:source>(2008)</dc:source>
    <dc:date>2008-07-17T00:09:48-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:category>discriminative</prism:category>
    <prism:category>machine-learning</prism:category>
    <prism:category>negative-evidence</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/1466789">
    <title>An Algorithm to Determine Peer-Reviewers</title>
    <link>http://www.citeulike.org/user/markusd/article/1466789</link>
    <description>&lt;i&gt;(24 May 2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;The peer-review process is the most widely accepted certification mechanism for legitimizing the written results of researchers within the scientific community. An essential component of this process is the identification of competent referees to review a submitted manuscript. This paper presents an algorithm to automatically determine the most appropriate reviewers for a manuscript by way of a co-authorship network data structure and a relative-rank particle-swarm algorithm. This approach is novel in that it is not limited to a pre-selected set of referees, is computationally efficient, requires no human-intervention, and can automatically identify conflict of interest situations. The algorithm is validated using referee bid data from the 2005 Joint Conference on Digital Libraries.</description>
    <dc:title>An Algorithm to Determine Peer-Reviewers</dc:title>

    <dc:creator>Marko Rodriguez</dc:creator>
    <dc:creator>Johan Bollen</dc:creator>
    <dc:source>(24 May 2006)</dc:source>
    <dc:date>2007-07-19T08:51:55-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:category>machine-learning</prism:category>
    <prism:category>misc</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/3001638">
    <title>The Dynamic Hierarchical Dirichlet Process</title>
    <link>http://www.citeulike.org/user/markusd/article/3001638</link>
    <description>&lt;i&gt;(2008)&lt;/i&gt;</description>
    <dc:title>The Dynamic Hierarchical Dirichlet Process</dc:title>

    <dc:creator>Lu Ren</dc:creator>
    <dc:creator>David Dunson</dc:creator>
    <dc:creator>Lawrence Carin</dc:creator>
    <dc:source>(2008)</dc:source>
    <dc:date>2008-07-15T09:38:33-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/3015179">
    <title>Ultraconservative Online Algorithms for Multiclass Problems</title>
    <link>http://www.citeulike.org/user/markusd/article/3015179</link>
    <description>&lt;i&gt;Vol. 2111 (2001), pp. 99-115.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;In this paper we study a paradigm to generalize online classification algorithms for binary classification problems to multiclass problems. The particular hypotheses we investigate maintain one prototype vector per class. Given an input instance, a multiclass hypothesis computes a similarityscore between each prototype and the input instance and sets the predicted label to be the index of the prototype achieving the highest similarity. To design and analyze the learning algorithms in this...</description>
    <dc:title>Ultraconservative Online Algorithms for Multiclass Problems</dc:title>

    <dc:creator>Koby Crammer</dc:creator>
    <dc:creator>Yoram Singer</dc:creator>
    <dc:source>Vol. 2111 (2001), pp. 99-115.</dc:source>
    <dc:date>2008-07-17T17:35:49-00:00</dc:date>
    <prism:publicationYear>2001</prism:publicationYear>
    <prism:volume>2111</prism:volume>
    <prism:startingPage>99</prism:startingPage>
    <prism:endingPage>115</prism:endingPage>
    <prism:publisher>Springer, Berlin</prism:publisher>
    <prism:category>machine-learning</prism:category>
    <prism:category>mira</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/1321312">
    <title>Arabic morphology using only finite-state operations</title>
    <link>http://www.citeulike.org/user/markusd/article/1321312</link>
    <description>&lt;i&gt;&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Finite-state morphology has been successful in the description and computational implementation of a wide variety of natural languages. However, the particular challenges of Arabic, and the limitations of some implementations of finite-state morphology, have led many researchers to believe that finite-state power was not sufficient to handle Arabic and other Semitic morphology. This paper illustrates how the morphotactics and the variation rules of Arabic have been described using only...</description>
    <dc:title>Arabic morphology using only finite-state operations</dc:title>

    <dc:creator>K Beesley</dc:creator>
    <dc:date>2007-05-23T12:19:30-00:00</dc:date>
    <prism:category>arabic</prism:category>
    <prism:category>morphology-project</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2879987">
    <title>Nonparametric Bayesian Discrete Latent Variable Models for Unsupervised Learning</title>
    <link>http://www.citeulike.org/user/markusd/article/2879987</link>
    <description>&lt;i&gt;(20 April 2007)&lt;/i&gt;</description>
    <dc:title>Nonparametric Bayesian Discrete Latent Variable Models for Unsupervised Learning</dc:title>

    <dc:creator>Dilan Görür</dc:creator>
    <dc:source>(20 April 2007)</dc:source>
    <dc:date>2008-06-10T15:21:35-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:category>bayes</prism:category>
    <prism:category>hidden-variable</prism:category>
    <prism:category>machine-learning</prism:category>
    <prism:category>non-parametric</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2877651">
    <title>A Discriminative Latent Variable Model for Statistical Machine Translation</title>
    <link>http://www.citeulike.org/user/markusd/article/2877651</link>
    <description>&lt;i&gt;(2008)&lt;/i&gt;</description>
    <dc:title>A Discriminative Latent Variable Model for Statistical Machine Translation</dc:title>

    <dc:creator>Phil Blunsom</dc:creator>
    <dc:creator>Trevor Cohn</dc:creator>
    <dc:creator>Miles Osborne</dc:creator>
    <dc:source>(2008)</dc:source>
    <dc:date>2008-06-09T17:01:36-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:category>discriminative</prism:category>
    <prism:category>smt</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2865762">
    <title>Discriminative Word Alignment with Conditional Random Fields</title>
    <link>http://www.citeulike.org/user/markusd/article/2865762</link>
    <description>&lt;i&gt;(July 2006), pp. 65-72.&lt;/i&gt;</description>
    <dc:title>Discriminative Word Alignment with Conditional Random Fields</dc:title>

    <dc:creator>Phil Blunsom</dc:creator>
    <dc:creator>Trevor Cohn</dc:creator>
    <dc:source>(July 2006), pp. 65-72.</dc:source>
    <dc:date>2008-06-05T14:51:15-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:startingPage>65</prism:startingPage>
    <prism:endingPage>72</prism:endingPage>
    <prism:publisher>Association for Computational Linguistics</prism:publisher>
    <prism:category>crf</prism:category>
    <prism:category>discriminative</prism:category>
    <prism:category>smt</prism:category>
    <prism:category>word-alignment</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/404842">
    <title>Grafting: fast, incremental feature selection by gradient descent in function space</title>
    <link>http://www.citeulike.org/user/markusd/article/404842</link>
    <description>&lt;i&gt;J. Mach. Learn. Res., Vol. 3 (2003), pp. 1333-1356.&lt;/i&gt;</description>
    <dc:title>Grafting: fast, incremental feature selection by gradient descent in function space</dc:title>

    <dc:creator>Simon Perkins</dc:creator>
    <dc:creator>Kevin Lacker</dc:creator>
    <dc:creator>James Theiler</dc:creator>
    <dc:source>J. Mach. Learn. Res., Vol. 3 (2003), pp. 1333-1356.</dc:source>
    <dc:date>2005-11-22T17:56:36-00:00</dc:date>
    <prism:publicationYear>2003</prism:publicationYear>
    <prism:publicationName>J. Mach. Learn. Res.</prism:publicationName>
    <prism:issn>1533-7928</prism:issn>
    <prism:volume>3</prism:volume>
    <prism:startingPage>1333</prism:startingPage>
    <prism:endingPage>1356</prism:endingPage>
    <prism:publisher>MIT Press</prism:publisher>
    <prism:category>crf</prism:category>
    <prism:category>feature-selection</prism:category>
    <prism:category>machine-learning</prism:category>
    <prism:category>morphology-project</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2853679">
    <title>ParaMor: Minimally Supervised Induction of Paradigm Structure and Morphological Analysis</title>
    <link>http://www.citeulike.org/user/markusd/article/2853679</link>
    <description>&lt;i&gt;(June 2007), pp. 117-125.&lt;/i&gt;</description>
    <dc:title>ParaMor: Minimally Supervised Induction of Paradigm Structure and Morphological Analysis</dc:title>

    <dc:creator>Christian Monson</dc:creator>
    <dc:creator>Jaime Carbonell</dc:creator>
    <dc:creator>Alon Lavie</dc:creator>
    <dc:creator>Lori Levin</dc:creator>
    <dc:source>(June 2007), pp. 117-125.</dc:source>
    <dc:date>2008-05-31T21:16:22-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:startingPage>117</prism:startingPage>
    <prism:endingPage>125</prism:endingPage>
    <prism:publisher>Association for Computational Linguistics</prism:publisher>
    <prism:category>morphology-project</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2649887">
    <title>Efficient Multi-pass Decoding for Synchronous Context Free Grammars</title>
    <link>http://www.citeulike.org/user/markusd/article/2649887</link>
    <description>&lt;i&gt;(2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We take a multi-pass approach to ma- chine translation decoding when using syn- chronous context-free grammars as the trans- lation model and n-gram language models: the ﬁrst pass uses a bigram language model, and the resulting parse forest is used in the second pass to guide search with a trigram lan- guage model. The trigram pass closes most of the performance gap between a bigram de- coder and a much slower trigram decoder, but takes time that is insigniﬁcant in comparison to the bigram pass. An additional fast de- coding pass maximizing the expected count of correct translation hypotheses increases the BLEU score signiﬁcantly.</description>
    <dc:title>Efficient Multi-pass Decoding for Synchronous Context Free Grammars</dc:title>

    <dc:creator>Hao Zhang</dc:creator>
    <dc:creator>Daniel Gildea</dc:creator>
    <dc:source>(2008)</dc:source>
    <dc:date>2008-04-10T16:25:23-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:category>smt</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2853609">
    <title>Phonological Constraints and Morphological Preprocessing for Grapheme-to-Phoneme Conversion</title>
    <link>http://www.citeulike.org/user/markusd/article/2853609</link>
    <description>&lt;i&gt;(June 2007), pp. 96-103.&lt;/i&gt;</description>
    <dc:title>Phonological Constraints and Morphological Preprocessing for Grapheme-to-Phoneme Conversion</dc:title>

    <dc:creator>Vera Demberg</dc:creator>
    <dc:creator>Helmut Schmid</dc:creator>
    <dc:creator>Gregor Möhler</dc:creator>
    <dc:source>(June 2007), pp. 96-103.</dc:source>
    <dc:date>2008-05-31T19:52:48-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:startingPage>96</prism:startingPage>
    <prism:endingPage>103</prism:endingPage>
    <prism:publisher>Association for Computational Linguistics</prism:publisher>
    <prism:category>joint-ngram</prism:category>
    <prism:category>morphology-project</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/438894">
    <title>Latent Dirichlet allocation</title>
    <link>http://www.citeulike.org/user/markusd/article/438894</link>
    <description>&lt;i&gt;(2002)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We describe latent Dirichlet allocation (LDA), a generative probabilistic model for collections of discrete data such as text corpora. LDA is a three-level hierarchical Bayesian model, in which each item of a collection is modeled as a finite mixture over an underlying set of topics. Each topic is, in turn, modeled as an infinite mixture over an underlying set of topic probabilities. In the context of text modeling, the topic probabilities provide an explicit representation of a document....</description>
    <dc:title>Latent Dirichlet allocation</dc:title>

    <dc:creator>D Blei</dc:creator>
    <dc:creator>A Ng</dc:creator>
    <dc:creator>M Jordan</dc:creator>
    <dc:source>(2002)</dc:source>
    <dc:date>2005-12-15T14:31:27-00:00</dc:date>
    <prism:publicationYear>2002</prism:publicationYear>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2837648">
    <title>Inducing Features of Random Fields</title>
    <link>http://www.citeulike.org/user/markusd/article/2837648</link>
    <description>&lt;i&gt;IEEE Transactions on Pattern Analysis and Machine Intelligence, Vol. 19, No. 4. (1997), pp. 380-393.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We present a technique for constructing random fields from a set of training samples. The learning paradigm builds increasingly complex fields by allowing potential functions, or features, that are supported by increasingly large subgraphs. Each feature has a weight that is trained by minimizing the Kullback-Leibler divergence between the model and the empirical distribution of the training data. A greedy algorithm determines how features are incrementally added to the field and an iterative...</description>
    <dc:title>Inducing Features of Random Fields</dc:title>

    <dc:creator>Stephen Della Pietra</dc:creator>
    <dc:creator>Vincent Della Pietra</dc:creator>
    <dc:creator>John Lafferty</dc:creator>
    <dc:source>IEEE Transactions on Pattern Analysis and Machine Intelligence, Vol. 19, No. 4. (1997), pp. 380-393.</dc:source>
    <dc:date>2008-05-27T14:26:23-00:00</dc:date>
    <prism:publicationYear>1997</prism:publicationYear>
    <prism:publicationName>IEEE Transactions on Pattern Analysis and Machine Intelligence</prism:publicationName>
    <prism:volume>19</prism:volume>
    <prism:number>4</prism:number>
    <prism:startingPage>380</prism:startingPage>
    <prism:endingPage>393</prism:endingPage>
    <prism:category>crf</prism:category>
    <prism:category>feature-selection</prism:category>
    <prism:category>machine-learning</prism:category>
    <prism:category>morphology-project</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/1816299">
    <title>Infinite Hidden Relational Models</title>
    <link>http://www.citeulike.org/user/markusd/article/1816299</link>
    <description>&lt;i&gt;(2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Relational learning analyzes the probabilistic constraints between the attributes of entities and relationships. We extend the expressiveness of relational models by introducing for each entity (or object) an infinitedimensional latent variable as part of a Dirichlet process (DP) mixture model. We discuss inference in the model, which is based on a DP Gibbs sampler, i.e., the Chinese restaurant process. We extended the Chinese restaurant process to be applicable to relational modeling. We discuss how information is propagated in the network of latent variables, reducing the necessity for extensive structural learning. In the context of a recommendation engine our approach realizes a principled solution for recommendations based on features of items, features of users and relational information. Our approach is evaluated in three applications: a recommendation system based on the Movie- Lens data set, the prediction of gene function using relational information and a medical recommendation system.</description>
    <dc:title>Infinite Hidden Relational Models</dc:title>

    <dc:creator>Zhao Xu</dc:creator>
    <dc:creator>Volker Tresp</dc:creator>
    <dc:creator>Kai Yu</dc:creator>
    <dc:creator>Hans-Peter Kriegel</dc:creator>
    <dc:source>(2006)</dc:source>
    <dc:date>2007-10-24T17:32:55-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2098449">
    <title>Structured priors for structure learning</title>
    <link>http://www.citeulike.org/user/markusd/article/2098449</link>
    <description>&lt;i&gt;(2006)&lt;/i&gt;</description>
    <dc:title>Structured priors for structure learning</dc:title>

    <dc:creator>V Mansinghka</dc:creator>
    <dc:creator>C Kemp</dc:creator>
    <dc:creator>J Tenenbaum</dc:creator>
    <dc:creator>T Griffiths</dc:creator>
    <dc:source>(2006)</dc:source>
    <dc:date>2007-12-12T12:38:36-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2795079">
    <title>Hidden conditional random fields for phone classification</title>
    <link>http://www.citeulike.org/user/markusd/article/2795079</link>
    <description>&lt;i&gt;(2005)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;In this paper, we show the novel application of hidden conditional random fields (HCRFs) -- conditional random fields with hidden state sequences -- for modeling speech. Hidden state sequences are critical for modeling the non-stationarity of speech signals. We show that HCRFs can easily be trained using the simple direct optimization technique of stochastic gradient descent. We present the results on the TIMIT phone classification task and show that HCRFs outperforms comparable ML and CML/MMI trained HMMs. In fact, HCRF results on this task are the best single classifier results known to us. We note that the HCRF framework is easily extensible to recognition since it is a state and label sequence modeling technique. We also note that HCRFs have the ability to handle complex features without any change in training procedure.</description>
    <dc:title>Hidden conditional random fields for phone classification</dc:title>

    <dc:creator>Asela Gunawardana</dc:creator>
    <dc:creator>Milind Mahajan</dc:creator>
    <dc:creator>Alex Acero</dc:creator>
    <dc:creator>John Platt</dc:creator>
    <dc:source>(2005)</dc:source>
    <dc:date>2008-05-13T13:56:00-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:category>crf</prism:category>
    <prism:category>discriminative</prism:category>
    <prism:category>hcrf</prism:category>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2795073">
    <title>Training algorithms for hidden conditional random fields</title>
    <link>http://www.citeulike.org/user/markusd/article/2795073</link>
    <description>&lt;i&gt;(2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We investigate algorithms for training hidden conditional random fields (HCRFs) – a class of direct models with hidden state sequences. We compare stochastic gradient ascent with the RProp algorithm, and investigate stochastic versions of RProp. We propose a new scheme for model flattening, and compare it to the state of the art. Finally we give experimental results on the TIMIT phone classification task showing how these training options interact, comparing HCRFs to HMMs trained using extended Baum-Welch as well as stochastic gradient methods.</description>
    <dc:title>Training algorithms for hidden conditional random fields</dc:title>

    <dc:creator>Milind Mahajan</dc:creator>
    <dc:creator>Asela Gunawardana</dc:creator>
    <dc:creator>Alex Acero</dc:creator>
    <dc:source>(2006)</dc:source>
    <dc:date>2008-05-13T13:54:20-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:category>crf</prism:category>
    <prism:category>discriminative</prism:category>
    <prism:category>hcrf</prism:category>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2795060">
    <title>Regularization, Adaptation, and Non-Independent Features Improve Hidden Conditional Random Fields for Phone Classification</title>
    <link>http://www.citeulike.org/user/markusd/article/2795060</link>
    <description>&lt;i&gt;(2007)&lt;/i&gt;</description>
    <dc:title>Regularization, Adaptation, and Non-Independent Features Improve Hidden Conditional Random Fields for Phone Classification</dc:title>

    <dc:creator>Yun-Hsuan Sung</dc:creator>
    <dc:creator>Constantinos Boulis</dc:creator>
    <dc:creator>Christopher Manning</dc:creator>
    <dc:creator>Dan Jurafsky</dc:creator>
    <dc:source>(2007)</dc:source>
    <dc:date>2008-05-13T13:48:02-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:category>crf</prism:category>
    <prism:category>discriminative</prism:category>
    <prism:category>hcrf</prism:category>
    <prism:category>morphology-project</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2416370">
    <title>Morphology Induction from Limited Noisy Data Using Approximate String Matching</title>
    <link>http://www.citeulike.org/user/markusd/article/2416370</link>
    <description>&lt;i&gt;(June 2006), pp. 60-68.&lt;/i&gt;</description>
    <dc:title>Morphology Induction from Limited Noisy Data Using Approximate String Matching</dc:title>

    <dc:creator>Burcu Ayan</dc:creator>
    <dc:creator>David Doermann</dc:creator>
    <dc:creator>Amy Weinberg</dc:creator>
    <dc:source>(June 2006), pp. 60-68.</dc:source>
    <dc:date>2008-02-23T01:39:37-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:startingPage>60</prism:startingPage>
    <prism:endingPage>68</prism:endingPage>
    <prism:publisher>Association for Computational Linguistics</prism:publisher>
    <prism:category>morphology-project</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2416377">
    <title>Learning Probabilistic Paradigms for Morphology in a Latent Class Model</title>
    <link>http://www.citeulike.org/user/markusd/article/2416377</link>
    <description>&lt;i&gt;(June 2006), pp. 69-78.&lt;/i&gt;</description>
    <dc:title>Learning Probabilistic Paradigms for Morphology in a Latent Class Model</dc:title>

    <dc:creator>Erwin Chan</dc:creator>
    <dc:source>(June 2006), pp. 69-78.</dc:source>
    <dc:date>2008-02-23T01:42:38-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:startingPage>69</prism:startingPage>
    <prism:endingPage>78</prism:endingPage>
    <prism:publisher>Association for Computational Linguistics</prism:publisher>
    <prism:category>morphology-project</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/474507">
    <title>Factor graphs and the sum-product algorithm</title>
    <link>http://www.citeulike.org/user/markusd/article/474507</link>
    <description>&lt;i&gt;Information Theory, IEEE Transactions on, Vol. 47, No. 2. (2001), pp. 498-519.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Algorithms that must deal with complicated global functions of many variables often exploit the manner in which the given functions factor as a product of &#8220;local&#8221; functions, each of which depends on a subset of the variables. Such a factorization can be visualized with a bipartite graph that we call a factor graph, In this tutorial paper, we present a generic message-passing algorithm, the sum-product algorithm, that operates in a factor graph. Following a single, simple computational rule, the sum-product algorithm computes-either exactly or approximately-various marginal functions derived from the global function. A wide variety of algorithms developed in artificial intelligence, signal processing, and digital communications can be derived as specific instances of the sum-product algorithm, including the forward/backward algorithm, the Viterbi algorithm, the iterative &#8220;turbo&#8221; decoding algorithm, Pearl's (1988) belief propagation algorithm for Bayesian networks, the Kalman filter, and certain fast Fourier transform (FFT) algorithms</description>
    <dc:title>Factor graphs and the sum-product algorithm</dc:title>

    <dc:creator>FR Kschischang</dc:creator>
    <dc:creator>BJ Frey</dc:creator>
    <dc:creator>HA Loeliger</dc:creator>
    <dc:identifier>doi:10.1109/18.910572</dc:identifier>
    <dc:source>Information Theory, IEEE Transactions on, Vol. 47, No. 2. (2001), pp. 498-519.</dc:source>
    <dc:date>2006-01-21T22:06:50-00:00</dc:date>
    <prism:publicationYear>2001</prism:publicationYear>
    <prism:publicationName>Information Theory, IEEE Transactions on</prism:publicationName>
    <prism:volume>47</prism:volume>
    <prism:number>2</prism:number>
    <prism:startingPage>498</prism:startingPage>
    <prism:endingPage>519</prism:endingPage>
    <prism:category>machine-learning</prism:category>
    <prism:category>morphology-project</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2157295">
    <title>Inside-Outside Probability Computation for Belief Propagation</title>
    <link>http://www.citeulike.org/user/markusd/article/2157295</link>
    <description>&lt;i&gt;(2007)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;In this paper we prove that the well-known correspondence between the forward-backward algorithm for hidden Markov models (HMMs) and belief propagation (BP) applied to HMMs can be generalized to one between BP for junction trees and the generalized inside-outside probability computation for probabilistic logic programs applied to junction trees.</description>
    <dc:title>Inside-Outside Probability Computation for Belief Propagation</dc:title>

    <dc:creator>Taisuke Sato</dc:creator>
    <dc:source>(2007)</dc:source>
    <dc:date>2007-12-21T22:28:39-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:category>belief-propagation</prism:category>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2296567">
    <title>An introduction to factor graphs</title>
    <link>http://www.citeulike.org/user/markusd/article/2296567</link>
    <description>&lt;i&gt;Signal Processing Magazine, IEEE, Vol. 21, No. 1. (2004), pp. 28-41.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Graphical models such as factor graphs allow a unified approach to a number of key topics in coding and signal processing such as the iterative decoding of turbo codes, LDPC codes and similar codes, joint decoding, equalization, parameter estimation, hidden-Markov models, Kalman filtering, and recursive least squares. Graphical models can represent complex real-world systems, and such representations help to derive practical detection/estimation algorithms in a wide area of applications. Most known signal processing techniques -including gradient methods, Kalman filtering, and particle methods -can be used as components of such algorithms. Other than most of the previous literature, we have used Forney-style factor graphs, which support hierarchical modeling and are compatible with standard block diagrams.</description>
    <dc:title>An introduction to factor graphs</dc:title>

    <dc:creator>HA Loeliger</dc:creator>
    <dc:identifier>doi:10.1109/MSP.2004.1267047</dc:identifier>
    <dc:source>Signal Processing Magazine, IEEE, Vol. 21, No. 1. (2004), pp. 28-41.</dc:source>
    <dc:date>2008-01-28T06:57:13-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:publicationName>Signal Processing Magazine, IEEE</prism:publicationName>
    <prism:volume>21</prism:volume>
    <prism:number>1</prism:number>
    <prism:startingPage>28</prism:startingPage>
    <prism:endingPage>41</prism:endingPage>
    <prism:category>graph</prism:category>
    <prism:category>graphical-models</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2131744">
    <title>Walk-Sums and Belief Propagation in Gaussian Graphical Models</title>
    <link>http://www.citeulike.org/user/markusd/article/2131744</link>
    <description>&lt;i&gt;Journal of Machine Learning Research, Vol. 7 (October 2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We present a new framework based on walks in a graph for analysis and inference in Gaussian graphical models. The key idea is to decompose the correlation between each pair of variables as a sum over all walks between those variables in the graph. The weight of each walk is given by a product of edge-wise partial correlation coefficients. This representation holds for a large class of Gaussian graphical models which we call walk-summable. We give a precise characterization of this class of...</description>
    <dc:title>Walk-Sums and Belief Propagation in Gaussian Graphical Models</dc:title>

    <dc:creator>Dmitry Malioutov</dc:creator>
    <dc:creator>Jason Johnson</dc:creator>
    <dc:creator>Alan Willsky</dc:creator>
    <dc:source>Journal of Machine Learning Research, Vol. 7 (October 2006)</dc:source>
    <dc:date>2007-12-16T10:05:22-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Journal of Machine Learning Research</prism:publicationName>
    <prism:volume>7</prism:volume>
    <prism:category>belief-propagation</prism:category>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2731299">
    <title>Understanding the Subprime Mortgage Crisis</title>
    <link>http://www.citeulike.org/user/markusd/article/2731299</link>
    <description>&lt;i&gt;Social Science Research Network Working Paper Series (29 February 2008)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Using loan-level data, we analyze the quality of subprime mortgage loans by adjusting their performance for differences in borrower characteristics, loan characteristics, and house price appreciation since origination. We find that the quality of loans deteriorated for six consecutive years before the crisis and that securitizers were, to some extent, aware of it. We provide evidence that the rise and fall of the subprime mortgage market follows a classic lending boom-bust scenario, in which unsustainable growth leads to the collapse of the market. Problems could have been detected long before the crisis, but they were masked by high house price appreciation between 2003 and 2005.</description>
    <dc:title>Understanding the Subprime Mortgage Crisis</dc:title>

    <dc:creator>Yuliya Demyanyk</dc:creator>
    <dc:creator>Otto Hemert</dc:creator>
    <dc:source>Social Science Research Network Working Paper Series (29 February 2008)</dc:source>
    <dc:date>2008-04-28T23:25:08-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publicationName>Social Science Research Network Working Paper Series</prism:publicationName>
    <prism:category>misc</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2767135">
    <title>The Infinite Hidden Markov Model</title>
    <link>http://www.citeulike.org/user/markusd/article/2767135</link>
    <description>&lt;i&gt;(2002)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We show that it is possible to extend hidden Markov models to have a countably infinite number of hidden states. By using the theory of Dirichlet processes we can implicitly integrate out the infinitely many transition parameters, leaving only three hyperparameters which can be learned from data. These three hyperparameters define a hierarchical Dirichlet process capable of capturing a rich set of transition dynamics. The three hyperparameters control the time scale of the dynamics, the...</description>
    <dc:title>The Infinite Hidden Markov Model</dc:title>

    <dc:creator>MJ Beal</dc:creator>
    <dc:creator>Z Ghahramani</dc:creator>
    <dc:creator>CE Rasmussen</dc:creator>
    <dc:source>(2002)</dc:source>
    <dc:date>2008-05-07T18:37:32-00:00</dc:date>
    <prism:publicationYear>2002</prism:publicationYear>
    <prism:publisher>MIT Press</prism:publisher>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2393065">
    <title>The Infinite Markov Model</title>
    <link>http://www.citeulike.org/user/markusd/article/2393065</link>
    <description>&lt;i&gt;(2008)&lt;/i&gt;</description>
    <dc:title>The Infinite Markov Model</dc:title>

    <dc:creator>Daichi Mochihashi</dc:creator>
    <dc:creator>Eiichiro Sumita</dc:creator>
    <dc:source>(2008)</dc:source>
    <dc:date>2008-02-18T09:13:26-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:publisher>MIT Press</prism:publisher>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2416208">
    <title>Introduction: A Typological Approach to Algorithmic Morphology</title>
    <link>http://www.citeulike.org/user/markusd/article/2416208</link>
    <description>&lt;i&gt;(November 2007)&lt;/i&gt;</description>
    <dc:title>Introduction: A Typological Approach to Algorithmic Morphology</dc:title>

    <dc:creator>T Mayer</dc:creator>
    <dc:creator>B Wälchli</dc:creator>
    <dc:source>(November 2007)</dc:source>
    <dc:date>2008-02-23T00:49:29-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:category>morphology-project</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2347455">
    <title>Graph Walks and Graphical Models</title>
    <link>http://www.citeulike.org/user/markusd/article/2347455</link>
    <description>&lt;i&gt;(2007)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Inference in Markov random fields, and development and evaluation of similarity measures for nodes in graphs, are both active areas of data-mining research. In this paper, we demonstrate a formal connection between inference in tree-structured Markov random fields and personalized PageRank, a widely-used similarity measure for graph nodes based on graphwalks. In particular we show a connection between computation of marginal probabilities in tree-structured discrete-variable pairwise MRFs, and computation of similarity between vertices of a graph using the personalized PageRank measure: roughly speaking, for these MRFs, computing a marginal probability Pr(Xi = j) can be reduced to computing a small set of personalized-PageRank similarity vectors, followed by a very limited postprocessing stage.</description>
    <dc:title>Graph Walks and Graphical Models</dc:title>

    <dc:creator>William Cohen</dc:creator>
    <dc:source>(2007)</dc:source>
    <dc:date>2008-02-07T01:24:26-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:category>graph</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/415566">
    <title>Graph Theory</title>
    <link>http://www.citeulike.org/user/markusd/article/415566</link>
    <description>&lt;i&gt;&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;An effort has been made to present the various topics in the theory of graphs in a logical order, to indicate the historical background, and to clarify the exposition by including figures to illustrate concepts and results. In addition, there are three appendices which provide diagrams of graphs, directed graphs, and trees. The emphasis throughout is on theorems rather than algorithms or applications, which however are occaisionally mentioned.</description>
    <dc:title>Graph Theory</dc:title>

    <dc:creator>Frank Harary</dc:creator>
    <dc:date>2005-11-30T17:15:17-00:00</dc:date>
    <prism:publisher>Addison Wesley Publishing Company</prism:publisher>
    <prism:category>graphs</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/105906">
    <title>Foundations of Statistical Natural Language Processing</title>
    <link>http://www.citeulike.org/user/markusd/article/105906</link>
    <description>&lt;i&gt;(18 June 1999)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;&#34;Statistical natural-language processing is, in my estimation, one of the most fast-moving and exciting areas of computer science these days. Anyone who wants to learn this field would be well advised to get this book. For that matter, the same goes for anyone who is already in the field. I know that it is going to be one of the most well-thumbed books on my bookshelf.&#34; -- Eugene Charniak, Department of Computer Science, Brown University &#60;P&#62;Statistical approaches to processing natural language text have become dominant in recent years. This foundational text is the first comprehensive introduction to statistical natural language processing (NLP) to appear. The book contains all the theory and algorithms needed for building NLP tools. It provides broad but rigorous coverage of mathematical and linguistic foundations, as well as detailed discussion of statistical methods, allowing students and researchers to construct their own implementations. The book covers collocation finding, word sense disambiguation, probabilistic parsing, information retrieval, and other applications. &#60;P&#62;More on this book</description>
    <dc:title>Foundations of Statistical Natural Language Processing</dc:title>

    <dc:creator>Christopher Manning</dc:creator>
    <dc:creator>Hinrich Schtze</dc:creator>
    <dc:source>(18 June 1999)</dc:source>
    <dc:date>2005-02-27T13:16:32-00:00</dc:date>
    <prism:publicationYear>1999</prism:publicationYear>
    <prism:publisher>The MIT Press</prism:publisher>
    <prism:category>nlp</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/828999">
    <title>Bayesian Computation Via the Gibbs Sampler and Related Markov Chain Monte Carlo Methods</title>
    <link>http://www.citeulike.org/user/markusd/article/828999</link>
    <description>&lt;i&gt;&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;The use of the Gibbs sampler for Bayesian computation is reviewed and illustrated in the context of some canonical examples. Other Markov chain Monte Carlo simulation methods are also briefly described, and comments are made on the advantages of sample-based approaches for Bayesian inference summaries.</description>
    <dc:title>Bayesian Computation Via the Gibbs Sampler and Related Markov Chain Monte Carlo Methods</dc:title>

    <dc:creator>AFM Smith</dc:creator>
    <dc:creator>GO Roberts</dc:creator>
    <dc:date>2006-09-05T17:59:27-00:00</dc:date>
    <prism:category>gibbs</prism:category>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2766880">
    <title>PCA versus LDA</title>
    <link>http://www.citeulike.org/user/markusd/article/2766880</link>
    <description>&lt;i&gt;IEEE Transactions on Pattern Analysis and Machine Intelligence, Vol. 23, No. 2. (2001), pp. 228-233.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;In the context of the appearance-based paradigm for object recognition, it is generally believed that algorithms based on LDA (Linear Discriminant Analysis) are superior to those based on PCA (Principal Components Analysis) . In this communication we show that this is not always the case. We present our case first by using intuitively plausible arguments and then by showing actual results on a face database. Our overall conclusion is that when the training dataset is small, PCA can outperform...</description>
    <dc:title>PCA versus LDA</dc:title>

    <dc:creator>Aleix Martinez</dc:creator>
    <dc:creator>Avinash Kak</dc:creator>
    <dc:source>IEEE Transactions on Pattern Analysis and Machine Intelligence, Vol. 23, No. 2. (2001), pp. 228-233.</dc:source>
    <dc:date>2008-05-07T16:01:07-00:00</dc:date>
    <prism:publicationYear>2001</prism:publicationYear>
    <prism:publicationName>IEEE Transactions on Pattern Analysis and Machine Intelligence</prism:publicationName>
    <prism:volume>23</prism:volume>
    <prism:number>2</prism:number>
    <prism:startingPage>228</prism:startingPage>
    <prism:endingPage>233</prism:endingPage>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/1454024">
    <title>PCA versus LDA</title>
    <link>http://www.citeulike.org/user/markusd/article/1454024</link>
    <description>&lt;i&gt;IEEE Trans. Pattern Anal. Mach. Intell., Vol. 23, No. 2. (February 2001), pp. 228-233.&lt;/i&gt;</description>
    <dc:title>PCA versus LDA</dc:title>

    <dc:creator>Aleix Mart&#8712;ez</dc:creator>
    <dc:creator>Avinash Kak</dc:creator>
    <dc:identifier>doi:10.1109/34.908974</dc:identifier>
    <dc:source>IEEE Trans. Pattern Anal. Mach. Intell., Vol. 23, No. 2. (February 2001), pp. 228-233.</dc:source>
    <dc:date>2007-07-13T12:09:22-00:00</dc:date>
    <prism:publicationYear>2001</prism:publicationYear>
    <prism:publicationName>IEEE Trans. Pattern Anal. Mach. Intell.</prism:publicationName>
    <prism:issn>0162-8828</prism:issn>
    <prism:volume>23</prism:volume>
    <prism:number>2</prism:number>
    <prism:startingPage>228</prism:startingPage>
    <prism:endingPage>233</prism:endingPage>
    <prism:publisher>IEEE Computer Society</prism:publisher>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/148945">
    <title>Machine Learning</title>
    <link>http://www.citeulike.org/user/markusd/article/148945</link>
    <description>&lt;i&gt;(01 March 1997)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;This book covers the field of machine learning, which is the study of algorithms that allow computer programs to automatically improve through experience. The book is intended to support upper level undergraduate and introductory level graduate courses in machine learning.</description>
    <dc:title>Machine Learning</dc:title>

    <dc:creator>Tom Mitchell</dc:creator>
    <dc:source>(01 March 1997)</dc:source>
    <dc:date>2005-04-03T20:00:27-00:00</dc:date>
    <prism:publicationYear>1997</prism:publicationYear>
    <prism:publisher>McGraw-Hill Science/Engineering/Math</prism:publisher>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/2011105">
    <title>Exponential Priors for Maximum Entropy Models</title>
    <link>http://www.citeulike.org/user/markusd/article/2011105</link>
    <description>&lt;i&gt;(2003)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Maximum entropy models are a common modeling technique, but prone to overfitting. We show that using an exponential distribution as a prior leads to bounded absolute discounting by a constant. We show that this prior is better motivated by the data than previous techniques such as a Gaussian prior, and often produces lower error rates. Exponential priors also lead to a simpler learning algorithm and to easier to understand behavior. Furthermore, exponential priors help explain the...</description>
    <dc:title>Exponential Priors for Maximum Entropy Models</dc:title>

    <dc:creator>J Goodman</dc:creator>
    <dc:source>(2003)</dc:source>
    <dc:date>2007-11-29T06:34:47-00:00</dc:date>
    <prism:publicationYear>2003</prism:publicationYear>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/110110">
    <title>The information bottleneck method</title>
    <link>http://www.citeulike.org/user/markusd/article/110110</link>
    <description>&lt;i&gt;(1999), pp. 368-377.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We define the relevant information in a signal x 2 X as being the information that this signal provides about another signal y 2 Y . Examples include the information that face images provide about the names of the people portrayed, or the information that speech sounds provide about the words spoken. Understanding the signal x requires more than just predicting y, it also requires specifying which features of X play a role in the prediction. We formalize the problem as that of finding a short...</description>
    <dc:title>The information bottleneck method</dc:title>

    <dc:creator>N Tishby</dc:creator>
    <dc:creator>F Pereira</dc:creator>
    <dc:creator>W Bialek</dc:creator>
    <dc:source>(1999), pp. 368-377.</dc:source>
    <dc:date>2005-03-02T06:57:17-00:00</dc:date>
    <prism:publicationYear>1999</prism:publicationYear>
    <prism:startingPage>368</prism:startingPage>
    <prism:endingPage>377</prism:endingPage>
    <prism:category>machine-learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/markusd/article/873540">
    <title>Pattern Recognition and Machine Learning (Information Science and Statistics)</title>
    <link>http://www.citeulike.org/user/markusd/article/873540</link>
    <description>&lt;i&gt;(28 August 2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;The dramatic growth in practical applications for machine learning over the last ten years has been accompanied by many important developments in the underlying algorithms and techniques. For example, Bayesian methods have grown from a specialist niche to become mainstream, while graphical models have emerged as a general framework for describing and applying probabilistic techniques. The practical applicability of Bayesian methods has been greatly enhanced by the development of a range of approximate inference algorithms such as variational Bayes and expectation propagation, while new models based on kernels have had a significant impact on both algorithms and applications. This completely new textbook reflects these recent developments while providing a comprehensive introduction to the fields of pattern recognition and machine learning. It is aimed at advanced undergraduates or first-year PhD students, as well as researchers and practitioners. No previous knowledge of pattern recognition or machine learning concepts is assumed. Familiarity with multivariate calculus and basic linear algebra is required, and some experience in the use of probabilities would be helpful though not essential as the book includes a self-contained introduction to basic probability theory. The book is suitable for courses on machine learning, statistics, computer science, signal processing, computer vision, data mining, and bioinformatics. Extensive support is provided for course instructors, including more than 400 exercises, graded according to difficulty. Example solutions for a subset of the exercises are available from the book web site, while solutions for the remainder can be obtained by instructors from the publisher. The book is supported by a great deal of additional material, and the reader is encouraged to visit the book web site for the latest information. A forthcoming companion volume will deal with practical aspects of pattern recognition and machine learning, and will include free software implementations of the key algorithms along with example data sets and demonstration programs. Christopher Bishop is Assistant Director at Microsoft Research Cambridge, and also holds a Chair in Computer Science at the University of Edinburgh. He is a Fellow of Darwin College Cambridge, and was recently elected Fellow of the Royal Academy of Engineering. The author's previous textbook &#34;Neural Networks for Pattern Recognition&#34; has been widely adopted.</description>
    <dc:title>Pattern Recognition and Machine Learning (Information Science and Statistics)</dc:title>

    <dc:creator>Christopher Bishop</dc:creator>
    <dc:source>(28 August 2006)</dc:source>
    <dc:date>2006-09-26T12:22:37-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publisher>Springer</prism:publisher>
    <prism:category>machine-learning</prism:category>
    <prism:category>sum-product</prism:category>
</item>



</rdf:RDF>

