<?xml version="1.0" encoding="UTF-8"?>

<rdf:RDF
   xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
   xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#"
   xmlns="http://purl.org/rss/1.0/"
   xmlns:dc="http://purl.org/dc/elements/1.1/"
   xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/"
   xmlns:dcterms="http://purl.org/dc/terms/"

>
<channel rdf:about="http://www.citeulike.org/about">
<pubDate>Wed, 20 Aug 2008 21:17:33 BST</pubDate>


	<title>CiteULike: matwendt's statistical-nlp</title>
	<description>CiteULike: matwendt's statistical-nlp</description>


	<link>http://www.citeulike.org/user/matwendt/tag/statistical-nlp</link>
	<dc:publisher>CiteULike.org</dc:publisher>
	<dc:language>en-gb</dc:language>
	<dc:rights>Copyright &#169; 2004-2008 citeulike.org</dc:rights>
	<items>
    <rdf:Seq>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/1856373"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/1222866"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/105906"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/1343015"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/1342754"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/1342717"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/833490"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/282193"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/1321514"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/1321502"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/1321490"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/1321399"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/1321396"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/1321385"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/1321376"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/1321372"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/1321357"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/1321340"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/1321308"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/1321306"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/1321250"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/1289617"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/1287849"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/1287839"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/1248098"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/matwendt/article/705498"/>

	</rdf:Seq>
	</items>
	</channel>


<item rdf:about="http://www.citeulike.org/user/matwendt/article/1856373">
    <title>Noun-Phrase Co-Occurence Statistics for Semi-Automatic Semantic Lexicon Construction</title>
    <link>http://www.citeulike.org/user/matwendt/article/1856373</link>
    <description>&lt;i&gt;(1998), pp. 1110-1116.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Generating semantic lexicons semiautomatically could be a great time saver, relative to creating them by hand. In this paper, we present an algorithm for extracting potential entries for a category from an on-line corpus, based upon a small set of exemplars. Our algorithm finds more correct terms and fewer incorrect ones than previous work in this area. Additionally, the entries that are generated potentially provide broader coverage of the category than vould occur to an individual coding them ...</description>
    <dc:title>Noun-Phrase Co-Occurence Statistics for Semi-Automatic Semantic Lexicon Construction</dc:title>

    <dc:creator>Brian Roark</dc:creator>
    <dc:creator>Eugene Charniak</dc:creator>
    <dc:source>(1998), pp. 1110-1116.</dc:source>
    <dc:date>2007-11-02T14:16:54-00:00</dc:date>
    <prism:publicationYear>1998</prism:publicationYear>
    <prism:startingPage>1110</prism:startingPage>
    <prism:endingPage>1116</prism:endingPage>
    <prism:category>lexicon-acquisition</prism:category>
    <prism:category>statistical-nlp</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/matwendt/article/1222866">
    <title>Is Knowledge-Free Induction of Multiword Unit Dictionary Headwords a Solved Problem?</title>
    <link>http://www.citeulike.org/user/matwendt/article/1222866</link>
    <description>&lt;i&gt;&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We seek a knowledge-free method for inducing multiword units from text corpora for use as machine-readable dictionary headwords. We provide two major evaluations of nine existing collocation-finders and illustrate the continuing need for improvement. We use Latent Semantic Analysis to make modest gains in performance, but we show the significant challenges encountered in trying this approach. 1</description>
    <dc:title>Is Knowledge-Free Induction of Multiword Unit Dictionary Headwords a Solved Problem?</dc:title>

    <dc:creator>Patrick Schone</dc:creator>
    <dc:creator>Daniel Jurafsky</dc:creator>
    <dc:date>2007-04-12T20:28:28-00:00</dc:date>
    <prism:category>corpus</prism:category>
    <prism:category>lexicon-acquisition</prism:category>
    <prism:category>statistical-nlp</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/matwendt/article/105906">
    <title>Foundations of Statistical Natural Language Processing</title>
    <link>http://www.citeulike.org/user/matwendt/article/105906</link>
    <description>&lt;i&gt;(18 June 1999)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;&#34;Statistical natural-language processing is, in my estimation, one of the most fast-moving and exciting areas of computer science these days. Anyone who wants to learn this field would be well advised to get this book. For that matter, the same goes for anyone who is already in the field. I know that it is going to be one of the most well-thumbed books on my bookshelf.&#34; -- Eugene Charniak, Department of Computer Science, Brown University &#60;P&#62;Statistical approaches to processing natural language text have become dominant in recent years. This foundational text is the first comprehensive introduction to statistical natural language processing (NLP) to appear. The book contains all the theory and algorithms needed for building NLP tools. It provides broad but rigorous coverage of mathematical and linguistic foundations, as well as detailed discussion of statistical methods, allowing students and researchers to construct their own implementations. The book covers collocation finding, word sense disambiguation, probabilistic parsing, information retrieval, and other applications. &#60;P&#62;More on this book</description>
    <dc:title>Foundations of Statistical Natural Language Processing</dc:title>

    <dc:creator>Christopher Manning</dc:creator>
    <dc:creator>Hinrich Schütze</dc:creator>
    <dc:source>(18 June 1999)</dc:source>
    <dc:date>2005-02-27T13:16:32-00:00</dc:date>
    <prism:publicationYear>1999</prism:publicationYear>
    <prism:publisher>The MIT Press</prism:publisher>
    <prism:category>introduction</prism:category>
    <prism:category>overview</prism:category>
    <prism:category>statistical-nlp</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/matwendt/article/1343015">
    <title>Word space</title>
    <link>http://www.citeulike.org/user/matwendt/article/1343015</link>
    <description>&lt;i&gt;(1993)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Representations for semantic information about words are necessary for many applications of neural networks in natural language processing. This paper describes an efficient, corpus-based method for inducing distributed semantic representations for a large number of words (50,000) from lexical coccurrence statistics by means of a large-scale linear regression. The representations are successfully applied to word sense disambiguation using a nearest neighbor method.</description>
    <dc:title>Word space</dc:title>

    <dc:creator>Hinrich Schütze</dc:creator>
    <dc:source>(1993)</dc:source>
    <dc:date>2007-05-30T14:01:49-00:00</dc:date>
    <prism:publicationYear>1993</prism:publicationYear>
    <prism:publisher>Morgan Kaufmann Publishers</prism:publisher>
    <prism:category>co-occurrence</prism:category>
    <prism:category>disambiguation</prism:category>
    <prism:category>statistical-nlp</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/matwendt/article/1342754">
    <title>A Data-Driven Method for Classifying Connective Phrases</title>
    <link>http://www.citeulike.org/user/matwendt/article/1342754</link>
    <description>&lt;i&gt;&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;This paper describes a three-stage methodology for investigating the semantics and pragmatics of sentence and clause connective phrases. The first step in the methodology is to assemble a large corpus of connectives. The second step is to organise this corpus into a hierarchical taxonomy of synonyms and hyponyms, using a pre-theoretical substitution test. The final step is to impose a theoretical interpretation on the taxonomy. The taxonomy lends itself to an analysis of...</description>
    <dc:title>A Data-Driven Method for Classifying Connective Phrases</dc:title>

    <dc:creator>Alistair Knott</dc:creator>
    <dc:creator>Chris Mellish</dc:creator>
    <dc:date>2007-05-30T12:38:14-00:00</dc:date>
    <prism:category>coherence</prism:category>
    <prism:category>corpus</prism:category>
    <prism:category>discourse</prism:category>
    <prism:category>nlp</prism:category>
    <prism:category>rst</prism:category>
    <prism:category>statistical-nlp</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/matwendt/article/1342717">
    <title>Stochastic Text Generation</title>
    <link>http://www.citeulike.org/user/matwendt/article/1342717</link>
    <description>&lt;i&gt;&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Introduction: generation and understanding Natural Language Generation (NLG) research aims at systems which produce coherent natural language text from an underlying representation of knowledge. Systems must produce language|single sentences or more complex discourses|which (i) faithfully represents the relevant knowledge, and also (ii) does this in a naturalsounding way. These have been termed the delity and uency goals, respectively (Ward 1993). The uency goal leads to important dierences...</description>
    <dc:title>Stochastic Text Generation</dc:title>

    <dc:creator>Jon Oberlander</dc:creator>
    <dc:creator>Chris Brew</dc:creator>
    <dc:date>2007-05-30T12:17:03-00:00</dc:date>
    <prism:category>fluency</prism:category>
    <prism:category>nlg</prism:category>
    <prism:category>pragmatics</prism:category>
    <prism:category>statistical-nlp</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/matwendt/article/833490">
    <title>Generation that Exploits Corpus-Based Statistical Knowledge</title>
    <link>http://www.citeulike.org/user/matwendt/article/833490</link>
    <description>&lt;i&gt;(1998), pp. 704-710.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We describe novel aspects of a new natural language generator called Nitrogen. This generator has a highly flexible input representation that allows a spectrum of input from syntactic to semantic depth, and shifts the burden of many linguistic decisions to the statistical post-processor. The generation algorithm is compositional, making it efficient, yet it also handles non-compositional aspects of language. Nitrogen's design makes it robust and scalable, operating with lexicons and knowledge...</description>
    <dc:title>Generation that Exploits Corpus-Based Statistical Knowledge</dc:title>

    <dc:creator>Irene Langkilde</dc:creator>
    <dc:creator>Kevin Knight</dc:creator>
    <dc:source>(1998), pp. 704-710.</dc:source>
    <dc:date>2006-09-07T08:32:38-00:00</dc:date>
    <prism:publicationYear>1998</prism:publicationYear>
    <prism:startingPage>704</prism:startingPage>
    <prism:endingPage>710</prism:endingPage>
    <prism:category>corpus</prism:category>
    <prism:category>lexical-choice</prism:category>
    <prism:category>nlg</prism:category>
    <prism:category>statistical-nlp</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/matwendt/article/282193">
    <title>Automatic acquisition of hyponyms from large text corpora</title>
    <link>http://www.citeulike.org/user/matwendt/article/282193</link>
    <description>&lt;i&gt;(1992), pp. 539-545.&lt;/i&gt;</description>
    <dc:title>Automatic acquisition of hyponyms from large text corpora</dc:title>

    <dc:creator>Marti Hearst</dc:creator>
    <dc:identifier>doi:10.3115/992133.992154</dc:identifier>
    <dc:source>(1992), pp. 539-545.</dc:source>
    <dc:date>2005-08-15T10:52:53-00:00</dc:date>
    <prism:publicationYear>1992</prism:publicationYear>
    <prism:startingPage>539</prism:startingPage>
    <prism:endingPage>545</prism:endingPage>
    <prism:publisher>Association for Computational Linguistics</prism:publisher>
    <prism:category>corpus</prism:category>
    <prism:category>hyponym</prism:category>
    <prism:category>statistical-nlp</prism:category>
    <prism:category>text-mining</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/matwendt/article/1321514">
    <title>An Inductive-Learning Approach to Morphological Analysis</title>
    <link>http://www.citeulike.org/user/matwendt/article/1321514</link>
    <description>&lt;i&gt;&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Morphological analysis is an important subtask in text-to-speech conversion, hyphenation, and other language engineering tasks. The traditional approach to performing morphological analysis is to combine a morpheme lexicon, sets of (linguistic) rules, and heuristics to find a most probable analysis. In contrast, we present an inductive learning approach in which morphological analysis is reformulated as a segmentation task. We report on a number of experiments in which five inductive learning...</description>
    <dc:title>An Inductive-Learning Approach to Morphological Analysis</dc:title>

    <dc:creator>B Antal</dc:creator>
    <dc:creator>Walter</dc:creator>
    <dc:creator>D Weijters</dc:creator>
    <dc:date>2007-05-23T13:42:36-00:00</dc:date>
    <prism:category>lexicon-acquisition</prism:category>
    <prism:category>morphology</prism:category>
    <prism:category>statistical-nlp</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/matwendt/article/1321502">
    <title>Unsupervised Learning of Derivational Morphology from Inflectional Lexicons</title>
    <link>http://www.citeulike.org/user/matwendt/article/1321502</link>
    <description>&lt;i&gt;(1999)&lt;/i&gt;</description>
    <dc:title>Unsupervised Learning of Derivational Morphology from Inflectional Lexicons</dc:title>

    <dc:creator>Eric Gaussier</dc:creator>
    <dc:source>(1999)</dc:source>
    <dc:date>2007-05-23T13:36:56-00:00</dc:date>
    <prism:publicationYear>1999</prism:publicationYear>
    <prism:category>lexicon-acquisition</prism:category>
    <prism:category>morphology</prism:category>
    <prism:category>statistical-nlp</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/matwendt/article/1321490">
    <title>An automated learner for phonology and morphology</title>
    <link>http://www.citeulike.org/user/matwendt/article/1321490</link>
    <description>&lt;i&gt;(1999)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;This document is a summary, for ourselves and those who are curious, of the current state of our Phonological Learner. The Learner is the centerpiece of our current research project; it is a computer program whose purposes is to learn morphophonemic systems from input data, and to serve as a tool for modeling phonological and morphological knowledge in humans. 2. Rationale Linguists of many persuasions take a realist view of linguistic theory as it relates to learning: language learners, in...</description>
    <dc:title>An automated learner for phonology and morphology</dc:title>

    <dc:creator>A Albright</dc:creator>
    <dc:creator>B Hayes</dc:creator>
    <dc:source>(1999)</dc:source>
    <dc:date>2007-05-23T13:29:10-00:00</dc:date>
    <prism:publicationYear>1999</prism:publicationYear>
    <prism:category>morphology</prism:category>
    <prism:category>phonology</prism:category>
    <prism:category>statistical-nlp</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/matwendt/article/1321399">
    <title>Unsupervised Learning of Morphology Using a Novel Directed Search</title>
    <link>http://www.citeulike.org/user/matwendt/article/1321399</link>
    <description>&lt;i&gt;&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;This paper describes a system for the unsupervised learning of morphological suffixes and stems from word lists. The system is composed of a generative probability model and a novel search algorithm.</description>
    <dc:title>Unsupervised Learning of Morphology Using a Novel Directed Search</dc:title>

    <dc:creator>Algorithm The</dc:creator>
    <dc:date>2007-05-23T13:06:12-00:00</dc:date>
    <prism:category>lexicon-acquisition</prism:category>
    <prism:category>morphology</prism:category>
    <prism:category>statistical-nlp</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/matwendt/article/1321396">
    <title>A Bayesian Model for Morpheme and Paradigm Identification</title>
    <link>http://www.citeulike.org/user/matwendt/article/1321396</link>
    <description>&lt;i&gt;(2001), pp. 482-490.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;This paper describes a system for unsupervised learning of morphological affixes from texts or word lists. The system is composed of a generative probability model and a search algorithm. Experi- ments on the Wall Street Journal and the Hansard Corpus (French and English) demonstrate the effectiveness of this approach.</description>
    <dc:title>A Bayesian Model for Morpheme and Paradigm Identification</dc:title>

    <dc:creator>Matthew Snover</dc:creator>
    <dc:creator>Michael Brent</dc:creator>
    <dc:source>(2001), pp. 482-490.</dc:source>
    <dc:date>2007-05-23T13:04:01-00:00</dc:date>
    <prism:publicationYear>2001</prism:publicationYear>
    <prism:startingPage>482</prism:startingPage>
    <prism:endingPage>490</prism:endingPage>
    <prism:category>lexicon-acquisition</prism:category>
    <prism:category>morphology</prism:category>
    <prism:category>statistical-nlp</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/matwendt/article/1321385">
    <title>Unsupervised Learning of the Morphology of a Natural Language</title>
    <link>http://www.citeulike.org/user/matwendt/article/1321385</link>
    <description>&lt;i&gt;Computational Linguistics, Vol. 27 (2001), pp. 153-198.&lt;/i&gt;</description>
    <dc:title>Unsupervised Learning of the Morphology of a Natural Language</dc:title>

    <dc:creator>John Goldsmith</dc:creator>
    <dc:source>Computational Linguistics, Vol. 27 (2001), pp. 153-198.</dc:source>
    <dc:date>2007-05-23T12:56:55-00:00</dc:date>
    <prism:publicationYear>2001</prism:publicationYear>
    <prism:publicationName>Computational Linguistics</prism:publicationName>
    <prism:volume>27</prism:volume>
    <prism:startingPage>153</prism:startingPage>
    <prism:endingPage>198</prism:endingPage>
    <prism:category>lexicon-acquisition</prism:category>
    <prism:category>morphology</prism:category>
    <prism:category>statistical-nlp</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/matwendt/article/1321376">
    <title>A New Supervised Learning Algorithm for Word Sense Disambiguati on</title>
    <link>http://www.citeulike.org/user/matwendt/article/1321376</link>
    <description>&lt;i&gt;(July 1997), pp. 604-609.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;The Naive Mix is a new supervised learning algorithm that is based on a sequential method for selecting probabilistic models. The usual objective of model selection is to find a single model that adequately characterizes the data in a training sample. However, during model selection a sequence of models is generated that consists of the best--fitting model at each level of model complexity. The Naive Mix utilizes this sequence of models to define a probabilistic model which is then used as a...</description>
    <dc:title>A New Supervised Learning Algorithm for Word Sense Disambiguati on</dc:title>

    <dc:creator>T Pedersen</dc:creator>
    <dc:creator>R Bruce</dc:creator>
    <dc:source>(July 1997), pp. 604-609.</dc:source>
    <dc:date>2007-05-23T12:52:27-00:00</dc:date>
    <prism:publicationYear>1997</prism:publicationYear>
    <prism:startingPage>604</prism:startingPage>
    <prism:endingPage>609</prism:endingPage>
    <prism:category>statistical-nlp</prism:category>
    <prism:category>word-sense-disambiguation</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/matwendt/article/1321372">
    <title>Knowledge Lean Word Sense Disambiguation</title>
    <link>http://www.citeulike.org/user/matwendt/article/1321372</link>
    <description>&lt;i&gt;(July 1998), pp. 800-805.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We present a corpus--based approach to word--sense disambiguation that only requires information that can be automatically extracted from untagged text. We use unsupervised techniques to estimate the parameters of a model describing the conditional distribution of the sense group given the known contextual features. Both the EM algorithm and Gibbs Sampling are evaluated to determine which is most appropriate for our data. We compare their disambiguation accuracy in an experiment with thirteen...</description>
    <dc:title>Knowledge Lean Word Sense Disambiguation</dc:title>

    <dc:creator>T Pedersen</dc:creator>
    <dc:creator>R Bruce</dc:creator>
    <dc:source>(July 1998), pp. 800-805.</dc:source>
    <dc:date>2007-05-23T12:50:23-00:00</dc:date>
    <prism:publicationYear>1998</prism:publicationYear>
    <prism:startingPage>800</prism:startingPage>
    <prism:endingPage>805</prism:endingPage>
    <prism:category>statistical-nlp</prism:category>
    <prism:category>word-sense-disambiguation</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/matwendt/article/1321357">
    <title>Resources for Morphology Learning and Evaluation</title>
    <link>http://www.citeulike.org/user/matwendt/article/1321357</link>
    <description>&lt;i&gt;&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Recently, there has been a proliferation of research into the acquisition of morphological grammars---that is, grammars and lexicons required for computer-based morphological analysis and synthesis. The approaches to acquiring such grammars range from tools which structure data provided by native speakers and linguists, to unsupervised machine learning. Despite this flurry of research into morphology learning, a means of comparing results among different approaches is largely lacking. This...</description>
    <dc:title>Resources for Morphology Learning and Evaluation</dc:title>

    <dc:creator>Mike Maxwell</dc:creator>
    <dc:date>2007-05-23T12:43:58-00:00</dc:date>
    <prism:category>assessment</prism:category>
    <prism:category>lexicon-acquisition</prism:category>
    <prism:category>morphology</prism:category>
    <prism:category>statistical-nlp</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/matwendt/article/1321340">
    <title>Partially Supervised Learning of Morphology with Stochastic Transducers</title>
    <link>http://www.citeulike.org/user/matwendt/article/1321340</link>
    <description>&lt;i&gt;&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;In this paper I present an algorithm for the unsupervised learning of morphology using stochastic finite state transducers, in particular Pair Hidden Markov Models. The task is viewed as an alignment problem between two sets of words. A supervised model of morphology acquisition is converted to an unsupervised model by treating the alignment as a further hidden variable. The use of the Expectation-Maximisation algorithm for this task is studied, which leads to calculations involving the...</description>
    <dc:title>Partially Supervised Learning of Morphology with Stochastic Transducers</dc:title>

    <dc:creator>Alexander Clark</dc:creator>
    <dc:date>2007-05-23T12:34:47-00:00</dc:date>
    <prism:category>finite-state</prism:category>
    <prism:category>lexicon-acquisition</prism:category>
    <prism:category>morphology</prism:category>
    <prism:category>statistical-nlp</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/matwendt/article/1321308">
    <title>Knowledge-Free Induction of Morphology Using Latent Semantic Analysis</title>
    <link>http://www.citeulike.org/user/matwendt/article/1321308</link>
    <description>&lt;i&gt;(2000), pp. 67-72.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Morphology induction is a subproblem of important tasks like automatic learning of machine-readable dictionaries and grammar induction. Previous morphology induction approaches have relied solely on statistics of hypothesized stems and affixes to choose which axes to consider legitimate. Relying on stem-and-affix statistics rather than semantic knowledge leads to a number of problems, such as the inappropriate use of valid axes (&#34;ally&#34; stemming to &#34;all&#34;). We introduce a semantic-based algorithm ...</description>
    <dc:title>Knowledge-Free Induction of Morphology Using Latent Semantic Analysis</dc:title>

    <dc:creator>Patrick Schone</dc:creator>
    <dc:creator>Daniel Jurafsky</dc:creator>
    <dc:source>(2000), pp. 67-72.</dc:source>
    <dc:date>2007-05-23T12:15:17-00:00</dc:date>
    <prism:publicationYear>2000</prism:publicationYear>
    <prism:startingPage>67</prism:startingPage>
    <prism:endingPage>72</prism:endingPage>
    <prism:publisher>Association for Computational Linguistics</prism:publisher>
    <prism:category>classification</prism:category>
    <prism:category>lexicon-acquisition</prism:category>
    <prism:category>morphology</prism:category>
    <prism:category>statistical-nlp</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/matwendt/article/1321306">
    <title>Language-independent Induction of Part of Speech Class Labels Using Only Language Universals</title>
    <link>http://www.citeulike.org/user/matwendt/article/1321306</link>
    <description>&lt;i&gt;&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We introduce a language-independent strategy for inducing part of speech tags from corpora. Unlike other techniques that use language-specific lexicons, rulesets, and so forth to tag, our algorithm bootstraps only from cluster properties and language universals.</description>
    <dc:title>Language-independent Induction of Part of Speech Class Labels Using Only Language Universals</dc:title>

    <dc:creator>Patrick Schone</dc:creator>
    <dc:creator>Daniel Jurafsky</dc:creator>
    <dc:date>2007-05-23T12:14:17-00:00</dc:date>
    <prism:category>classification</prism:category>
    <prism:category>lexicon-acquisition</prism:category>
    <prism:category>pos-tagging</prism:category>
    <prism:category>statistical-nlp</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/matwendt/article/1321250">
    <title>A Markovian Lattice Model for the Acquisition of Morphological Structure</title>
    <link>http://www.citeulike.org/user/matwendt/article/1321250</link>
    <description>&lt;i&gt;(11 July 2001)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We describe a new formalism for word morphology. Our model views word generation as a random walk on a lattice of units where each unit is a set of (short) strings. The model naturally incorporates segmentation of words into morphemes. We capture the statistics of unit generation using a probabilistic suffix tree (PST) which is a variant of variable length Markov models. We present an efficient algorithm that learns a PST over the units whose output is a compact stochastic representation of ...</description>
    <dc:title>A Markovian Lattice Model for the Acquisition of Morphological Structure</dc:title>

    <dc:creator>Leonid Kontorovich</dc:creator>
    <dc:creator>Dana Ron</dc:creator>
    <dc:creator>Yoram Singer</dc:creator>
    <dc:source>(11 July 2001)</dc:source>
    <dc:date>2007-05-23T12:00:07-00:00</dc:date>
    <prism:publicationYear>2001</prism:publicationYear>
    <prism:category>lexicon-acquisition</prism:category>
    <prism:category>morphology</prism:category>
    <prism:category>statistical-nlp</prism:category>
    <prism:category>stemming</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/matwendt/article/1289617">
    <title>The Linguist's Guide to Statistics - Don't Panic</title>
    <link>http://www.citeulike.org/user/matwendt/article/1289617</link>
    <description>&lt;i&gt;&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;ion. In the mean while, we refer the reader to [Jelinek &#38; Mercer 1980] for Deleted Interpolation, to [Good 1953] and [Katz 1987] for Good-Turing reestimation, and to [Samuelsson 1996] for Successive Abstraction.  58 CHAPTER 2. APPLIED STATISTICS  Chapter 3 Basic Corpus Linguistics 3.1 Empirical Evaluation Chinchor et al. write in Computational Linguistics 19(3): &#34;One of the common problems with evaluations is that the statistical significance of the results is unknown&#34;, [Chinchor et al...</description>
    <dc:title>The Linguist's Guide to Statistics - Don't Panic</dc:title>

    <dc:creator>Brigitte Krenn</dc:creator>
    <dc:creator>Christer Samuelsson</dc:creator>
    <dc:date>2007-05-11T11:14:37-00:00</dc:date>
    <prism:category>linguistics</prism:category>
    <prism:category>statistical-nlp</prism:category>
    <prism:category>statistics</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/matwendt/article/1287849">
    <title>Word Sense Disambiguation in Untagged Text based on Term Weight Learning</title>
    <link>http://www.citeulike.org/user/matwendt/article/1287849</link>
    <description>&lt;i&gt;&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;This paper describes unsupervised learning algorithm for disambiguating verbal word senses using term weight learning.</description>
    <dc:title>Word Sense Disambiguation in Untagged Text based on Term Weight Learning</dc:title>

    <dc:creator>Fumiyo And</dc:creator>
    <dc:date>2007-05-10T10:05:54-00:00</dc:date>
    <prism:category>disambiguation</prism:category>
    <prism:category>sense</prism:category>
    <prism:category>statistical-nlp</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/matwendt/article/1287839">
    <title>Fast Statistical Parsing of Noun Phrases for Document Indexing</title>
    <link>http://www.citeulike.org/user/matwendt/article/1287839</link>
    <description>&lt;i&gt;(1997)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Information Retrieval (IR) is an important application area of Natural Language Processing (NLP) where one encounters the genuine challenge of processing large quantities of unrestricted natural language text. While much effort has been made to apply NLP techniques to IR, very few NLP techniques have been evaluated on a document collection larger than several megabytes. Many NLP techniques are simply not efficient enough, and not robust enough, to handle a large amount of text. This paper...</description>
    <dc:title>Fast Statistical Parsing of Noun Phrases for Document Indexing</dc:title>

    <dc:creator>C Zhai</dc:creator>
    <dc:source>(1997)</dc:source>
    <dc:date>2007-05-10T10:01:18-00:00</dc:date>
    <prism:publicationYear>1997</prism:publicationYear>
    <prism:category>chunking</prism:category>
    <prism:category>shallow-parsing</prism:category>
    <prism:category>statistical-nlp</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/matwendt/article/1248098">
    <title>Automatic Acquisition of a Large Subcategorization Dictionary from Corpora</title>
    <link>http://www.citeulike.org/user/matwendt/article/1248098</link>
    <description>&lt;i&gt;(1993), pp. 235-242.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;This paper presents a new method for producing a dictionary of subcategorization frames from unlabelled text corpora. It is shown that statistical filtering of the results of a finite state parser running on the output of a stochastic tagger produces high quality results, despite the error rates of the tagger and the parser. Further, it is argued that this method can be used to learn all subcategorization frames, whereas previous methods are not extensible to a general solution to the problem. ...</description>
    <dc:title>Automatic Acquisition of a Large Subcategorization Dictionary from Corpora</dc:title>

    <dc:creator>Christopher Manning</dc:creator>
    <dc:source>(1993), pp. 235-242.</dc:source>
    <dc:date>2007-04-24T16:18:00-00:00</dc:date>
    <prism:publicationYear>1993</prism:publicationYear>
    <prism:startingPage>235</prism:startingPage>
    <prism:endingPage>242</prism:endingPage>
    <prism:category>statistical-nlp</prism:category>
    <prism:category>subcategorization</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/matwendt/article/705498">
    <title>Class-Based n-gram Models of Natural Language</title>
    <link>http://www.citeulike.org/user/matwendt/article/705498</link>
    <description>&lt;i&gt;Computational Linguistics, Vol. 18, No. 4. (1992), pp. 467-479.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We address the problem of predicting a word from previous words in a sample of text. In particular, we discuss n-gram models based on classes of words. We also discuss several statistical algorithms for assigning words to classes based on the frequency of their cooccurrence with other words. We find that we are able to extract classes that have the flavor of either syntactically based groupings or semantically based groupings, depending on the nature of the underlying statistics. 1 ...</description>
    <dc:title>Class-Based n-gram Models of Natural Language</dc:title>

    <dc:creator>Peter Brown</dc:creator>
    <dc:creator>Vincent Della Pietra</dc:creator>
    <dc:creator>Peter Desouza</dc:creator>
    <dc:creator>Jennifer Lai</dc:creator>
    <dc:creator>Robert Mercer</dc:creator>
    <dc:source>Computational Linguistics, Vol. 18, No. 4. (1992), pp. 467-479.</dc:source>
    <dc:date>2006-06-21T10:34:48-00:00</dc:date>
    <prism:publicationYear>1992</prism:publicationYear>
    <prism:publicationName>Computational Linguistics</prism:publicationName>
    <prism:volume>18</prism:volume>
    <prism:number>4</prism:number>
    <prism:startingPage>467</prism:startingPage>
    <prism:endingPage>479</prism:endingPage>
    <prism:category>classification</prism:category>
    <prism:category>co-occurrence</prism:category>
    <prism:category>n-gram</prism:category>
    <prism:category>statistical-nlp</prism:category>
</item>



</rdf:RDF>

