<?xml version="1.0" encoding="UTF-8"?>

<rdf:RDF
   xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
   xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#"
   xmlns="http://purl.org/rss/1.0/"
   xmlns:dc="http://purl.org/dc/elements/1.1/"
   xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/"
   xmlns:dcterms="http://purl.org/dc/terms/"

>
<channel rdf:about="http://www.citeulike.org/about">
<pubDate>Wed, 20 Aug 2008 21:20:21 BST</pubDate>


	<title>CiteULike: lschilli's library [33 articles]</title>
	<description>CiteULike: lschilli's library [33 articles]</description>


	<link>http://www.citeulike.org/user/lschilli</link>
	<dc:publisher>CiteULike.org</dc:publisher>
	<dc:language>en-gb</dc:language>
	<dc:rights>Copyright &#169; 2004-2008 citeulike.org</dc:rights>
	<items>
    <rdf:Seq>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/1453749"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/408748"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/1161439"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/1154147"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/1151200"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/1143604"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/1138137"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/1138062"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/1132790"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/531106"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/1129810"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/1129808"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/191348"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/1109766"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/1103827"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/1101067"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/1039538"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/1031686"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/308922"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/263034"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/1002089"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/1001226"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/1001193"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/1001104"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/1000555"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/1000493"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/845449"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/876314"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/876278"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/875871"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/875719"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/875683"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/lschilli/article/875677"/>

	</rdf:Seq>
	</items>
	</channel>


<item rdf:about="http://www.citeulike.org/user/lschilli/article/1453749">
    <title>Corpus-Based Training of Action-Specific Language Models</title>
    <link>http://www.citeulike.org/user/lschilli/article/1453749</link>
    <description>&lt;i&gt;(2007)&lt;/i&gt;</description>
    <dc:title>Corpus-Based Training of Action-Specific Language Models</dc:title>

    <dc:creator>Lars Schillingmann</dc:creator>
    <dc:creator>Sven Wachsmuth</dc:creator>
    <dc:creator>Britta Wrede</dc:creator>
    <dc:source>(2007)</dc:source>
    <dc:date>2007-07-13T10:06:54-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/408748">
    <title>The impact of spoken interfaces on the design of service robots</title>
    <link>http://www.citeulike.org/user/lschilli/article/408748</link>
    <description>&lt;i&gt;Industrial Robot: An International Journal, Vol. 32, No. 6. (January 2005), pp. 499-504.&lt;/i&gt;</description>
    <dc:title>The impact of spoken interfaces on the design of service robots</dc:title>

    <dc:creator>G Bugmann</dc:creator>
    <dc:creator>JC Wolf</dc:creator>
    <dc:creator>P Robinson</dc:creator>
    <dc:source>Industrial Robot: An International Journal, Vol. 32, No. 6. (January 2005), pp. 499-504.</dc:source>
    <dc:date>2005-11-25T17:03:59-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Industrial Robot: An International Journal</prism:publicationName>
    <prism:issn>0143-991X</prism:issn>
    <prism:volume>32</prism:volume>
    <prism:number>6</prism:number>
    <prism:startingPage>499</prism:startingPage>
    <prism:endingPage>504</prism:endingPage>
    <prism:publisher>Emerald Group Publishing Limited</prism:publisher>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/1161439">
    <title>Die Evaluierung von Spracherkennungssystemen in Deutschland</title>
    <link>http://www.citeulike.org/user/lschilli/article/1161439</link>
    <description>&lt;i&gt;(July 1995)&lt;/i&gt;</description>
    <dc:title>Die Evaluierung von Spracherkennungssystemen in Deutschland</dc:title>

    <dc:creator>Erwin Paulus</dc:creator>
    <dc:creator>Michael Lehning</dc:creator>
    <dc:source>(July 1995)</dc:source>
    <dc:date>2007-03-14T20:34:33-00:00</dc:date>
    <prism:publicationYear>1995</prism:publicationYear>
    <prism:publisher>TU Braunschweig</prism:publisher>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/1154147">
    <title>Principal Component Analysis</title>
    <link>http://www.citeulike.org/user/lschilli/article/1154147</link>
    <description>&lt;i&gt;(01 October 2002)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Principal component analysis is central to the study of multivariate data. Although one of the earliest multivariate techniques it continues to be the subject of much research, ranging from new model- based approaches to algorithmic ideas from neural networks. It is extremely versatile with applications in many disciplines. The first edition of this book was the first comprehensive text written solely on principal component analysis. The second edition updates and substantially expands the original version, and is once again the definitive text on the subject. It includes core material, current research and a wide range of applications. Its length is nearly double that of the first edition. Researchers in statistics, or in other fields that use principal component analysis, will find that the book gives an authoritative yet accessible account of the subject. It is also a valuable resource for graduate courses in multivariate analysis. The book requires some knowledge of matrix algebra. Ian Jolliffe is Professor of Statistics at the University of Aberdeen. He is author or co-author of over 60 research papers and three other books. His research interests are broad, but aspects of principal component analysis have fascinated him and kept him busy for over 30 years.</description>
    <dc:title>Principal Component Analysis</dc:title>

    <dc:creator>IT Jolliffe</dc:creator>
    <dc:source>(01 October 2002)</dc:source>
    <dc:date>2007-03-11T15:04:52-00:00</dc:date>
    <prism:publicationYear>2002</prism:publicationYear>
    <prism:publisher>Springer</prism:publisher>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/1151200">
    <title>Introduction To Algorithms</title>
    <link>http://www.citeulike.org/user/lschilli/article/1151200</link>
    <description>&lt;i&gt;(1998)&lt;/i&gt;</description>
    <dc:title>Introduction To Algorithms</dc:title>

    <dc:creator>Thomas Cormen</dc:creator>
    <dc:creator>Ronald Rivest</dc:creator>
    <dc:creator>Charles Leiserson</dc:creator>
    <dc:source>(1998)</dc:source>
    <dc:date>2007-03-09T13:48:08-00:00</dc:date>
    <prism:publicationYear>1998</prism:publicationYear>
    <prism:publisher>The MIT Press</prism:publisher>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/1143604">
    <title>Taschenbuch der Mathematik</title>
    <link>http://www.citeulike.org/user/lschilli/article/1143604</link>
    <description>&lt;i&gt;(September 2000)&lt;/i&gt;</description>
    <dc:title>Taschenbuch der Mathematik</dc:title>

    <dc:creator>Ilja Bronstein</dc:creator>
    <dc:creator>Konstantin Semendjajew</dc:creator>
    <dc:creator>Gerhard Musiol</dc:creator>
    <dc:source>(September 2000)</dc:source>
    <dc:date>2007-03-06T12:51:13-00:00</dc:date>
    <prism:publicationYear>2000</prism:publicationYear>
    <prism:publisher>Deutsch (Harri)</prism:publisher>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/1138137">
    <title>Modelling the Effects of Speech Rate Variation for Automatic Speech Recognition</title>
    <link>http://www.citeulike.org/user/lschilli/article/1138137</link>
    <description>&lt;i&gt;(2002)&lt;/i&gt;</description>
    <dc:title>Modelling the Effects of Speech Rate Variation for Automatic Speech Recognition</dc:title>

    <dc:creator>B Wrede</dc:creator>
    <dc:source>(2002)</dc:source>
    <dc:date>2007-03-03T17:41:17-00:00</dc:date>
    <prism:publicationYear>2002</prism:publicationYear>
    <prism:category>bibtex-import</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/1138062">
    <title>Handbuch zur Datenaufnahme und Transliteration in TP14 von VERBMOBIL -- 3.0</title>
    <link>http://www.citeulike.org/user/lschilli/article/1138062</link>
    <description>&lt;i&gt;Vol. VERBMOBIL Technisches Dokument Nr. 11 (September 1994)&lt;/i&gt;</description>
    <dc:title>Handbuch zur Datenaufnahme und Transliteration in TP14 von VERBMOBIL -- 3.0</dc:title>

    <dc:creator>Klaus Kohler</dc:creator>
    <dc:creator>Gloria Lex</dc:creator>
    <dc:creator>Matthias Pätzold</dc:creator>
    <dc:creator>Michael Scheffers</dc:creator>
    <dc:creator>Adrian Simpson</dc:creator>
    <dc:creator>Werner Thon</dc:creator>
    <dc:source>Vol. VERBMOBIL Technisches Dokument Nr. 11 (September 1994)</dc:source>
    <dc:date>2007-03-03T17:19:30-00:00</dc:date>
    <prism:publicationYear>1994</prism:publicationYear>
    <prism:volume>VERBMOBIL Technisches Dokument Nr. 11</prism:volume>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/1132790">
    <title>On the Use of Information Retrieval Measures for Speech Recognition Evaluation</title>
    <link>http://www.citeulike.org/user/lschilli/article/1132790</link>
    <description>&lt;i&gt;No. 73. (2004)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;This paper discusses the evaluation of automatic speech recognition (ASR) systems developed for practical applications, suggesting a set of criteria for application-oriented performance measures. The commonly used word error rate (WER), which poses ASR evaluation as a string editing process, is shown to have a number of limitations with respect to these criteria, motivating alternative or additional measures. This paper suggests that posing speech recognition evaluation as an information retrieval problem, where each word is one unit of information, offers a flexible framework for application-oriented performance analysis based on the concepts of recall and precision.</description>
    <dc:title>On the Use of Information Retrieval Measures for Speech Recognition Evaluation</dc:title>

    <dc:creator>I Mccowan</dc:creator>
    <dc:creator>D Moore</dc:creator>
    <dc:creator>J Dines</dc:creator>
    <dc:creator>Gatica Perez</dc:creator>
    <dc:creator>M Flynn</dc:creator>
    <dc:creator>P Wellner</dc:creator>
    <dc:creator>H Bourlard</dc:creator>
    <dc:source>No. 73. (2004)</dc:source>
    <dc:date>2007-03-01T01:43:20-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:number>73</prism:number>
    <prism:category>bibtex-import</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/531106">
    <title>A Study of Cross-Validation and Bootstrap for Accuracy Estimation and Model Selection</title>
    <link>http://www.citeulike.org/user/lschilli/article/531106</link>
    <description>&lt;i&gt;(1995), pp. 1137-1145.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We review accuracy estimation methods and compare the two most common methods: crossvalidation and bootstrap. Recent experimental results on artificial data and theoretical results in restricted settings have shown that for selecting a good classifier from a set of classifiers (model selection), ten-fold cross-validation may be better than the more expensive leaveone -out cross-validation. We report on a largescale experiment---over half a million runs of C4.5 and a Naive-Bayes algorithm---to...</description>
    <dc:title>A Study of Cross-Validation and Bootstrap for Accuracy Estimation and Model Selection</dc:title>

    <dc:creator>Ron Kohavi</dc:creator>
    <dc:source>(1995), pp. 1137-1145.</dc:source>
    <dc:date>2006-03-05T17:32:28-00:00</dc:date>
    <prism:publicationYear>1995</prism:publicationYear>
    <prism:startingPage>1137</prism:startingPage>
    <prism:endingPage>1145</prism:endingPage>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/1129810">
    <title>Generation of Language Models Using the Results of Image Analysis</title>
    <link>http://www.citeulike.org/user/lschilli/article/1129810</link>
    <description>&lt;i&gt;(1995), pp. 1739-1742.&lt;/i&gt;</description>
    <dc:title>Generation of Language Models Using the Results of Image Analysis</dc:title>

    <dc:creator>U Naeve</dc:creator>
    <dc:creator>G Socher</dc:creator>
    <dc:creator>GA Fink</dc:creator>
    <dc:creator>F Kummert</dc:creator>
    <dc:creator>G Sagerer</dc:creator>
    <dc:source>(1995), pp. 1739-1742.</dc:source>
    <dc:date>2007-02-28T15:24:55-00:00</dc:date>
    <prism:publicationYear>1995</prism:publicationYear>
    <prism:startingPage>1739</prism:startingPage>
    <prism:endingPage>1742</prism:endingPage>
    <prism:category>bibtex-import</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/1129808">
    <title>An Object-oriented Approach Using a Top-down and Bottom-up Process for Manipulative Action Recognition</title>
    <link>http://www.citeulike.org/user/lschilli/article/1129808</link>
    <description>&lt;i&gt;Vol. 4174 (2006), pp. 212-221.&lt;/i&gt;</description>
    <dc:title>An Object-oriented Approach Using a Top-down and Bottom-up Process for Manipulative Action Recognition</dc:title>

    <dc:creator>Zhe Li</dc:creator>
    <dc:creator>Jannik Fritsch</dc:creator>
    <dc:creator>Sven Wachsmuth</dc:creator>
    <dc:creator>Gerhard Sagerer</dc:creator>
    <dc:source>Vol. 4174 (2006), pp. 212-221.</dc:source>
    <dc:date>2007-02-28T15:24:39-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:volume>4174</prism:volume>
    <prism:startingPage>212</prism:startingPage>
    <prism:endingPage>221</prism:endingPage>
    <prism:publisher>Springer-Verlag</prism:publisher>
    <prism:category>bibtex-import</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/191348">
    <title>Maintaining knowledge about temporal intervals</title>
    <link>http://www.citeulike.org/user/lschilli/article/191348</link>
    <description>&lt;i&gt;Communications of the ACM, Vol. 26, No. 11. (November 1983), pp. 832-843.&lt;/i&gt;</description>
    <dc:title>Maintaining knowledge about temporal intervals</dc:title>

    <dc:creator>James Allen</dc:creator>
    <dc:identifier>doi:10.1145/182.358434</dc:identifier>
    <dc:source>Communications of the ACM, Vol. 26, No. 11. (November 1983), pp. 832-843.</dc:source>
    <dc:date>2005-05-10T22:22:20-00:00</dc:date>
    <prism:publicationYear>1983</prism:publicationYear>
    <prism:publicationName>Communications of the ACM</prism:publicationName>
    <prism:issn>0001-0782</prism:issn>
    <prism:volume>26</prism:volume>
    <prism:number>11</prism:number>
    <prism:startingPage>832</prism:startingPage>
    <prism:endingPage>843</prism:endingPage>
    <prism:publisher>ACM Press</prism:publisher>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/1109766">
    <title>Linking Speech and Gesture in Multimodal Instruction Systems</title>
    <link>http://www.citeulike.org/user/lschilli/article/1109766</link>
    <description>&lt;i&gt;(6-8 September 2006), pp. 141-144.&lt;/i&gt;</description>
    <dc:title>Linking Speech and Gesture in Multimodal Instruction Systems</dc:title>

    <dc:creator>JC Wolf</dc:creator>
    <dc:creator>G Bugmann</dc:creator>
    <dc:source>(6-8 September 2006), pp. 141-144.</dc:source>
    <dc:date>2007-02-16T14:11:48-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:startingPage>141</prism:startingPage>
    <prism:endingPage>144</prism:endingPage>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/1103827">
    <title>Recent advances in the automatic recognition of audiovisual speech</title>
    <link>http://www.citeulike.org/user/lschilli/article/1103827</link>
    <description>&lt;i&gt;Proceedings of the IEEE, Vol. 91, No. 9. (2003), pp. 1306-1326.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Visual speech information from the speaker's mouth region has been successfully shown to improve noise robustness of automatic speech recognizers, thus promising to extend their usability in the human computer interface. In this paper, we review the main components of audiovisual automatic speech recognition (ASR) and present novel contributions in two main areas: first, the visual front-end design, based on a cascade of linear image transforms of an appropriate video region of interest, and subsequently, audiovisual speech integration. On the latter topic, we discuss new work on feature and decision fusion combination, the modeling of audiovisual speech asynchrony, and incorporating modality reliability estimates to the bimodal recognition process. We also briefly touch upon the issue of audiovisual adaptation. We apply our algorithms to three multisubject bimodal databases, ranging from small- to large-vocabulary recognition tasks, recorded in both visually controlled and challenging environments. Our experiments demonstrate that the visual modality improves ASR over all conditions and data considered, though less so for visually challenging environments and large vocabulary tasks.</description>
    <dc:title>Recent advances in the automatic recognition of audiovisual speech</dc:title>

    <dc:creator>G Potamianos</dc:creator>
    <dc:creator>C Neti</dc:creator>
    <dc:creator>G Gravier</dc:creator>
    <dc:creator>A Garg</dc:creator>
    <dc:creator>AW Senior</dc:creator>
    <dc:identifier>doi:10.1109/JPROC.2003.817150</dc:identifier>
    <dc:source>Proceedings of the IEEE, Vol. 91, No. 9. (2003), pp. 1306-1326.</dc:source>
    <dc:date>2007-02-12T23:55:39-00:00</dc:date>
    <prism:publicationYear>2003</prism:publicationYear>
    <prism:publicationName>Proceedings of the IEEE</prism:publicationName>
    <prism:volume>91</prism:volume>
    <prism:number>9</prism:number>
    <prism:startingPage>1306</prism:startingPage>
    <prism:endingPage>1326</prism:endingPage>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/1101067">
    <title>Hearing lips and seeing voices</title>
    <link>http://www.citeulike.org/user/lschilli/article/1101067</link>
    <description>&lt;i&gt;Nature, Vol. 264, No. 5588. (23 December 1976), pp. 746-748.&lt;/i&gt;</description>
    <dc:title>Hearing lips and seeing voices</dc:title>

    <dc:creator>Harry Mcgurk</dc:creator>
    <dc:creator>John Macdonald</dc:creator>
    <dc:identifier>doi:10.1038/264746a0</dc:identifier>
    <dc:source>Nature, Vol. 264, No. 5588. (23 December 1976), pp. 746-748.</dc:source>
    <dc:date>2007-02-11T20:51:50-00:00</dc:date>
    <prism:publicationYear>1976</prism:publicationYear>
    <prism:publicationName>Nature</prism:publicationName>
    <prism:volume>264</prism:volume>
    <prism:number>5588</prism:number>
    <prism:startingPage>746</prism:startingPage>
    <prism:endingPage>748</prism:endingPage>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/1039538">
    <title>Automatische Spracherkennung: Grundlagen, statistische Modelle und effiziente Algorithmen</title>
    <link>http://www.citeulike.org/user/lschilli/article/1039538</link>
    <description>&lt;i&gt;(1995)&lt;/i&gt;</description>
    <dc:title>Automatische Spracherkennung: Grundlagen, statistische Modelle und effiziente Algorithmen</dc:title>

    <dc:creator>Ernst Schukat-Talamazzini</dc:creator>
    <dc:source>(1995)</dc:source>
    <dc:date>2007-01-13T15:16:29-00:00</dc:date>
    <prism:publicationYear>1995</prism:publicationYear>
    <prism:publisher>F. Vieweg</prism:publisher>
    <prism:category>books</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/1031686">
    <title>Mustererkennung mit Markov-Modellen</title>
    <link>http://www.citeulike.org/user/lschilli/article/1031686</link>
    <description>&lt;i&gt;(31 October 2003)&lt;/i&gt;</description>
    <dc:title>Mustererkennung mit Markov-Modellen</dc:title>

    <dc:creator>Gernot Fink</dc:creator>
    <dc:source>(31 October 2003)</dc:source>
    <dc:date>2007-01-09T17:14:19-00:00</dc:date>
    <prism:publicationYear>2003</prism:publicationYear>
    <prism:publisher>Teubner B.G. GmbH</prism:publisher>
    <prism:category>books</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/308922">
    <title>Statistical Methods for Speech Recognition</title>
    <link>http://www.citeulike.org/user/lschilli/article/308922</link>
    <description>&lt;i&gt;(16 January 1998)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;This book reflects decades of important research on the mathematical foundations of speech recognition. It focuses on underlying statistical techniques such as hidden Markov models, decision trees, the expectation-maximization algorithm, information theoretic goodness criteria, maximum entropy probability estimation, parameter and data clustering, and smoothing of probability distributions. The author's goal is to present these principles clearly in the simplest setting, to show the advantages of self-organization from real data, and to enable the reader to apply the techniques.</description>
    <dc:title>Statistical Methods for Speech Recognition</dc:title>

    <dc:creator>Frederick Jelinek</dc:creator>
    <dc:source>(16 January 1998)</dc:source>
    <dc:date>2005-08-31T14:41:48-00:00</dc:date>
    <prism:publicationYear>1998</prism:publicationYear>
    <prism:publisher>The MIT Press</prism:publisher>
    <prism:category>books</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/263034">
    <title>Spoken Language Processing: A Guide to Theory, Algorithm and System Development</title>
    <link>http://www.citeulike.org/user/lschilli/article/263034</link>
    <description>&lt;i&gt;(25 April 2001)&lt;/i&gt;</description>
    <dc:title>Spoken Language Processing: A Guide to Theory, Algorithm and System Development</dc:title>

    <dc:creator>Xuedong Huang</dc:creator>
    <dc:creator>Alex Acero</dc:creator>
    <dc:creator>Hsiao-Wuen Hon</dc:creator>
    <dc:source>(25 April 2001)</dc:source>
    <dc:date>2005-07-22T23:53:57-00:00</dc:date>
    <prism:publicationYear>2001</prism:publicationYear>
    <prism:publisher>Prentice Hall PTR</prism:publisher>
    <prism:category>books</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/1002089">
    <title>Incremental Speech Recognition for Multimodal Interfaces</title>
    <link>http://www.citeulike.org/user/lschilli/article/1002089</link>
    <description>&lt;i&gt;(September 1998), pp. 2012-2017.&lt;/i&gt;</description>
    <dc:title>Incremental Speech Recognition for Multimodal Interfaces</dc:title>

    <dc:creator>GA Fink</dc:creator>
    <dc:creator>C Schillo</dc:creator>
    <dc:creator>F Kummert</dc:creator>
    <dc:creator>G Sagerer</dc:creator>
    <dc:source>(September 1998), pp. 2012-2017.</dc:source>
    <dc:date>2006-12-19T16:15:34-00:00</dc:date>
    <prism:publicationYear>1998</prism:publicationYear>
    <prism:startingPage>2012</prism:startingPage>
    <prism:endingPage>2017</prism:endingPage>
    <prism:category>bibtex-import</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/1001226">
    <title>Robust Audiovisual Integration using Semicontinuous Hidden Markov Models</title>
    <link>http://www.citeulike.org/user/lschilli/article/1001226</link>
    <description>&lt;i&gt;Vol. 1 (1996), pp. 42-45.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We describe an improved method of integrating audio and visual information in a HMM-based audiovisual ASR system. The method uses a modified semi-continuous HMM (SCHMM) for integration and recognition. Our results show substantial improvements over earlier integration methods at high noise levels.</description>
    <dc:title>Robust Audiovisual Integration using Semicontinuous Hidden Markov Models</dc:title>

    <dc:creator>Q Su</dc:creator>
    <dc:creator>PL Silsbee</dc:creator>
    <dc:source>Vol. 1 (1996), pp. 42-45.</dc:source>
    <dc:date>2006-12-19T01:06:43-00:00</dc:date>
    <prism:publicationYear>1996</prism:publicationYear>
    <prism:volume>1</prism:volume>
    <prism:startingPage>42</prism:startingPage>
    <prism:endingPage>45</prism:endingPage>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/1001193">
    <title>Improving Speech Recognition on a Mobile Robot Platform through the use of Top-Down Visual Queues</title>
    <link>http://www.citeulike.org/user/lschilli/article/1001193</link>
    <description>&lt;i&gt;(9-15 August 2003)&lt;/i&gt;</description>
    <dc:title>Improving Speech Recognition on a Mobile Robot Platform through the use of Top-Down Visual Queues</dc:title>

    <dc:creator>RJ Ross</dc:creator>
    <dc:creator>RPS O'Donoghue</dc:creator>
    <dc:creator>GMP O'Hare</dc:creator>
    <dc:source>(9-15 August 2003)</dc:source>
    <dc:date>2006-12-19T00:38:12-00:00</dc:date>
    <prism:publicationYear>2003</prism:publicationYear>
    <prism:publisher>AAAI Press</prism:publisher>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/1001104">
    <title>Audio-Visual Large Vocabulary Continuous Speech Recognition in the Broadcast Domain</title>
    <link>http://www.citeulike.org/user/lschilli/article/1001104</link>
    <description>&lt;i&gt;(1999)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We consider the problem of combining visual cues with audio signals for the purpose of improved automatic machine recognition of speech. Although signifcant progress has been made in machine transcription of large vocabulary continuous speech (LVCSR) over the last few years, the technology to date is most eective only under controlled conditions such as low noise, speaker dependent recognition and read speech (as opposed to conversational speech) etc. On the otherhand, while augmenting the...</description>
    <dc:title>Audio-Visual Large Vocabulary Continuous Speech Recognition in the Broadcast Domain</dc:title>

    <dc:creator>S Basu</dc:creator>
    <dc:creator>C Neti</dc:creator>
    <dc:creator>A Senior</dc:creator>
    <dc:creator>N Rajput</dc:creator>
    <dc:creator>L Subramanium</dc:creator>
    <dc:creator>A Verma</dc:creator>
    <dc:source>(1999)</dc:source>
    <dc:date>2006-12-19T00:08:26-00:00</dc:date>
    <prism:publicationYear>1999</prism:publicationYear>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/1000555">
    <title>Using the Visual Component in Automatic Speech Recognition</title>
    <link>http://www.citeulike.org/user/lschilli/article/1000555</link>
    <description>&lt;i&gt;Vol. 3 (1996), pp. 1656-1659.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;The movements of talkers' faces are known to convey visual cues that can improve speech intelligibility, especially where there is noise or hearing-impairment. This suggests that visible facial gestures could be exploited to enhance speech intelligibility in automatic systems. Handling the volume of data represented by images of talkers' faces implies some form of data compression. Rather than using conventional feature extraction approaches, image coding and compression can be achieved using...</description>
    <dc:title>Using the Visual Component in Automatic Speech Recognition</dc:title>

    <dc:creator>NM Brooke</dc:creator>
    <dc:source>Vol. 3 (1996), pp. 1656-1659.</dc:source>
    <dc:date>2006-12-18T20:17:37-00:00</dc:date>
    <prism:publicationYear>1996</prism:publicationYear>
    <prism:volume>3</prism:volume>
    <prism:startingPage>1656</prism:startingPage>
    <prism:endingPage>1659</prism:endingPage>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/1000493">
    <title>Audio-Visual Speech Recognition, Final Workshop 2000 Report</title>
    <link>http://www.citeulike.org/user/lschilli/article/1000493</link>
    <description>&lt;i&gt;(12 October 2000)&lt;/i&gt;</description>
    <dc:title>Audio-Visual Speech Recognition, Final Workshop 2000 Report</dc:title>

    <dc:creator>C Neti</dc:creator>
    <dc:creator>G Potamianos</dc:creator>
    <dc:creator>J Luettin</dc:creator>
    <dc:creator>I Matthews</dc:creator>
    <dc:creator>H Glotin</dc:creator>
    <dc:creator>D Vergyri</dc:creator>
    <dc:creator>J Sison</dc:creator>
    <dc:creator>A Mashari</dc:creator>
    <dc:creator>J Zhou</dc:creator>
    <dc:source>(12 October 2000)</dc:source>
    <dc:date>2006-12-18T18:27:13-00:00</dc:date>
    <prism:publicationYear>2000</prism:publicationYear>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/845449">
    <title>Automatic Detection of Song Changes in Music Mixes Using Stochastic Models</title>
    <link>http://www.citeulike.org/user/lschilli/article/845449</link>
    <description>&lt;i&gt;Vol. 3 (2006), pp. 665-668.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;The annotation of song changes in music mixes created by DJs or radio stations for direct access in digital recordings is, usually, a very tedious work. In order to support this process we developed an automatic song change detection method which can be used for arbitrary music mixes. Stochastic models are applied to music data aiming at their segmentation with respect to automatically obtained abstract generic acoustic units. The local analysis of these stochastic music models provides hypotheses for song changes. Results of an experimental evaluation processing music mix data demonstrate the effectiveness of our method for supporting the annotation with respect to song changes.</description>
    <dc:title>Automatic Detection of Song Changes in Music Mixes Using Stochastic Models</dc:title>

    <dc:creator>Thomas Plötz</dc:creator>
    <dc:creator>Gernot Fink</dc:creator>
    <dc:creator>Peter Husemann</dc:creator>
    <dc:creator>Sven Kanies</dc:creator>
    <dc:creator>Kai Lienemann</dc:creator>
    <dc:creator>Tobias Marschall</dc:creator>
    <dc:creator>Marcel Martin</dc:creator>
    <dc:creator>Lars Schillingmann</dc:creator>
    <dc:creator>Matthias Steinrücken</dc:creator>
    <dc:creator>Henner Sudek</dc:creator>
    <dc:source>Vol. 3 (2006), pp. 665-668.</dc:source>
    <dc:date>2006-09-15T14:05:10-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:volume>3</prism:volume>
    <prism:startingPage>665</prism:startingPage>
    <prism:endingPage>668</prism:endingPage>
    <prism:publisher>IEEE</prism:publisher>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/876314">
    <title>Lexicalized grammar acquisition</title>
    <link>http://www.citeulike.org/user/lschilli/article/876314</link>
    <description>&lt;i&gt;(2003)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;This paper presents a formalization of automatic grammar acquisition that is based on lexicalized grammar formalisms (e.g. LTAG and HPSG). We state the conditions for the consistent acquisition of a unique lexicalized grammar from an annotated corpus.</description>
    <dc:title>Lexicalized grammar acquisition</dc:title>

    <dc:creator>M Ninomiya</dc:creator>
    <dc:creator>T Tsujii</dc:creator>
    <dc:source>(2003)</dc:source>
    <dc:date>2006-09-28T12:04:23-00:00</dc:date>
    <prism:publicationYear>2003</prism:publicationYear>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/876278">
    <title>Towards automatic grammar acquisition from a bracketed corpus</title>
    <link>http://www.citeulike.org/user/lschilli/article/876278</link>
    <description>&lt;i&gt;(1996)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;In this paper, we propose a method to group brackets in a bracketed corpus (with lexical tags), according to their local contextual information, as a first step towards the automatic acquisition of a context-free grammar. Using a bracketed corpus, the learning task is reduced to the problem of how to determine the nonterminal label of each bracket in the corpus. In a grouping process, a single nonterminal label is assigned to each group of brackets which are similar. Two techniques,...</description>
    <dc:title>Towards automatic grammar acquisition from a bracketed corpus</dc:title>

    <dc:creator>Thanaruk Theeramunkong</dc:creator>
    <dc:creator>Manabu Okumura</dc:creator>
    <dc:source>(1996)</dc:source>
    <dc:date>2006-09-28T10:25:59-00:00</dc:date>
    <prism:publicationYear>1996</prism:publicationYear>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/875871">
    <title>Zeitsynchrone Suche mit n-Gramm-Modellen höherer Ordnung</title>
    <link>http://www.citeulike.org/user/lschilli/article/875871</link>
    <description>&lt;i&gt;(2000), pp. 145-150.&lt;/i&gt;</description>
    <dc:title>Zeitsynchrone Suche mit n-Gramm-Modellen höherer Ordnung</dc:title>

    <dc:creator>GA Fink</dc:creator>
    <dc:creator>G Sagerer</dc:creator>
    <dc:source>(2000), pp. 145-150.</dc:source>
    <dc:date>2006-09-27T23:33:56-00:00</dc:date>
    <prism:publicationYear>2000</prism:publicationYear>
    <prism:startingPage>145</prism:startingPage>
    <prism:endingPage>150</prism:endingPage>
    <prism:publisher>VDE Verlag</prism:publisher>
    <prism:category>bibtex-import</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/875719">
    <title>Learning visually grounded words and syntax of natural spoken language</title>
    <link>http://www.citeulike.org/user/lschilli/article/875719</link>
    <description>&lt;i&gt;Evolution of Communication, Vol. 4, No. 1. (2001), pp. 33-56.&lt;/i&gt;</description>
    <dc:title>Learning visually grounded words and syntax of natural spoken language</dc:title>

    <dc:creator>Deb Roy</dc:creator>
    <dc:source>Evolution of Communication, Vol. 4, No. 1. (2001), pp. 33-56.</dc:source>
    <dc:date>2006-09-27T15:06:54-00:00</dc:date>
    <prism:publicationYear>2001</prism:publicationYear>
    <prism:publicationName>Evolution of Communication</prism:publicationName>
    <prism:volume>4</prism:volume>
    <prism:number>1</prism:number>
    <prism:startingPage>33</prism:startingPage>
    <prism:endingPage>56</prism:endingPage>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/875683">
    <title>Learning visually-grounded words and syntax for a scene description task</title>
    <link>http://www.citeulike.org/user/lschilli/article/875683</link>
    <description>&lt;i&gt;Computer Speech and Language (2002)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;A spoken language generation system has been developed that learns to describe objects in computer-generated visual scenes. The system is trained by a `show-and-tell' procedure in which visual scenes are paired with natural language descriptions. Learning algorithms acquire probabilistic structures which encode the visual semantics of phrase structure, word classes, and individual words. Using these structures, a planning algorithm integrates syntactic, semantic, and contextual constraints to...</description>
    <dc:title>Learning visually-grounded words and syntax for a scene description task</dc:title>

    <dc:creator>D Roy</dc:creator>
    <dc:source>Computer Speech and Language (2002)</dc:source>
    <dc:date>2006-09-27T14:08:28-00:00</dc:date>
    <prism:publicationYear>2002</prism:publicationYear>
    <prism:publicationName>Computer Speech and Language</prism:publicationName>
    <prism:category>no-tag</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/lschilli/article/875677">
    <title>Towards situated speech understanding: visual context priming of language models</title>
    <link>http://www.citeulike.org/user/lschilli/article/875677</link>
    <description>&lt;i&gt;Computer Speech &#38; Language, Vol. 19, No. 2. (April 2005), pp. 227-248.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Fuse is a situated spoken language understanding system that uses visual context to steer the interpretation of speech. Given a visual scene and a spoken description, the system finds the object in the scene that best fits the meaning of the description. To solve this task, Fuse performs speech recognition and visually-grounded language understanding. Rather than treat these two problems separately, knowledge of the visual semantics of language and the specific contents of the visual scene are fused during speech processing. As a result, the system anticipates various ways a person might describe any object in the scene, and uses these predictions to bias the speech recognizer towards likely sequences of words. A dynamic visual attention mechanism is used to focus processing on likely objects within the scene as spoken utterances are processed. Visual attention and language prediction reinforce one another and converge on interpretations of incoming speech signals which are most consistent with visual context. In evaluations, the introduction of visual context into the speech recognition process results in significantly improved speech recognition and understanding accuracy. The underlying principles of this model may be applied to a wide range of speech understanding problems including mobile and assistive technologies in which contextual information can be sensed and semantically interpreted to bias processing.</description>
    <dc:title>Towards situated speech understanding: visual context priming of language models</dc:title>

    <dc:creator>Deb Roy</dc:creator>
    <dc:creator>Niloy Mukherjee</dc:creator>
    <dc:identifier>doi:10.1016/j.csl.2004.08.003</dc:identifier>
    <dc:source>Computer Speech &#38; Language, Vol. 19, No. 2. (April 2005), pp. 227-248.</dc:source>
    <dc:date>2006-09-27T13:55:18-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Computer Speech &#38; Language</prism:publicationName>
    <prism:volume>19</prism:volume>
    <prism:number>2</prism:number>
    <prism:startingPage>227</prism:startingPage>
    <prism:endingPage>248</prism:endingPage>
    <prism:category>no-tag</prism:category>
</item>



</rdf:RDF>

