<?xml version="1.0" encoding="UTF-8"?>

<rdf:RDF
   xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
   xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#"
   xmlns="http://purl.org/rss/1.0/"
   xmlns:dc="http://purl.org/dc/elements/1.1/"
   xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/"
   xmlns:dcterms="http://purl.org/dc/terms/"

>
<channel rdf:about="http://www.citeulike.org/about">
<pubDate>Thu, 21 Aug 2008 14:17:15 BST</pubDate>


	<title>CiteULike: tgyork's ocr</title>
	<description>CiteULike: tgyork's ocr</description>


	<link>http://www.citeulike.org/user/tgyork/tag/ocr</link>
	<dc:publisher>CiteULike.org</dc:publisher>
	<dc:language>en-gb</dc:language>
	<dc:rights>Copyright &#169; 2004-2008 citeulike.org</dc:rights>
	<items>
    <rdf:Seq>
        <rdf:li rdf:resource="http://www.citeulike.org/user/tgyork/article/2799352"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/tgyork/article/894586"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/tgyork/article/2098806"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/tgyork/article/1952949"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/tgyork/article/816388"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/tgyork/article/1724221"/>

	</rdf:Seq>
	</items>
	</channel>


<item rdf:about="http://www.citeulike.org/user/tgyork/article/2799352">
    <title>OCR binarization and image pre-processing for searching historical documents</title>
    <link>http://www.citeulike.org/user/tgyork/article/2799352</link>
    <description>&lt;i&gt;Pattern Recognition, Vol. 40, No. 2. (February 2007), pp. 389-397.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We consider the problem of document binarization as a pre-processing step for optical character recognition (OCR) for the purpose of keyword search of historical printed documents. A number of promising techniques from the literature for binarization, pre-filtering, and post-binarization denoising were implemented along with newly developed methods for binarization: an error diffusion binarization, a multiresolutional version of Otsu's binarization, and denoising by despeckling. The OCR in the ABBYY FineReader 7.1 SDK is used as a black box metric to compare methods. Results for 12 pages from six newspapers of differing quality show that performance varies widely by image, but that the classic Otsu method and Otsu-based methods perform best on average.</description>
    <dc:title>OCR binarization and image pre-processing for searching historical documents</dc:title>

    <dc:creator>Maya Gupta</dc:creator>
    <dc:creator>Nathaniel Jacobson</dc:creator>
    <dc:creator>Eric Garcia</dc:creator>
    <dc:identifier>doi:10.1016/j.patcog.2006.04.043</dc:identifier>
    <dc:source>Pattern Recognition, Vol. 40, No. 2. (February 2007), pp. 389-397.</dc:source>
    <dc:date>2008-05-14T15:59:17-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:publicationName>Pattern Recognition</prism:publicationName>
    <prism:volume>40</prism:volume>
    <prism:number>2</prism:number>
    <prism:startingPage>389</prism:startingPage>
    <prism:endingPage>397</prism:endingPage>
    <prism:category>background</prism:category>
    <prism:category>binarisation</prism:category>
    <prism:category>historical</prism:category>
    <prism:category>image-processing</prism:category>
    <prism:category>ocr</prism:category>
    <prism:category>preprocessing</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/tgyork/article/894586">
    <title>Gradient-based contour encoding for character recognition</title>
    <link>http://www.citeulike.org/user/tgyork/article/894586</link>
    <description>&lt;i&gt;Pattern Recognition, Vol. 29, No. 7. (July 1996), pp. 1147-1160.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We describe novel methods of feature extraction for recognition of single isolated character images. Our approach is flexible in that the same algorithms can be used, without modification, for feature extraction in a variety of OCR problems. These include handwritten, machine-print, grayscale, binary and low-resolution character recognition. We use the gradient representation as the basis for extraction of low-level, structural and stroke-type features. These algorithms require a few simple arithmetic operations per image pixel which makes them suitable for real-time applications. A description of the algorithms and experiments with several data sets are presented in this paper. Experimental results using artificial neural networks are presented. Our results demonstrate high performance of these features when tested on data sets distinct from the training data.</description>
    <dc:title>Gradient-based contour encoding for character recognition</dc:title>

    <dc:creator>Geetha Srikantan</dc:creator>
    <dc:creator>Stephen Lam</dc:creator>
    <dc:creator>Sargur Srihari</dc:creator>
    <dc:identifier>doi:10.1016/0031-3203(95)00146-8</dc:identifier>
    <dc:source>Pattern Recognition, Vol. 29, No. 7. (July 1996), pp. 1147-1160.</dc:source>
    <dc:date>2006-10-12T20:22:21-00:00</dc:date>
    <prism:publicationYear>1996</prism:publicationYear>
    <prism:publicationName>Pattern Recognition</prism:publicationName>
    <prism:volume>29</prism:volume>
    <prism:number>7</prism:number>
    <prism:startingPage>1147</prism:startingPage>
    <prism:endingPage>1160</prism:endingPage>
    <prism:category>background</prism:category>
    <prism:category>character-based</prism:category>
    <prism:category>features</prism:category>
    <prism:category>ocr</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/tgyork/article/2098806">
    <title>Defining writer's invariants to adapt the recognition task</title>
    <link>http://www.citeulike.org/user/tgyork/article/2098806</link>
    <description>&lt;i&gt;Document Analysis and Recognition, 1999. ICDAR '99. Proceedings of the Fifth International Conference on (1999), pp. 765-768.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Investigates the automatic reading of unconstrained omni-writer handwritten texts. This paper shows how to endow the reading system with adaptation faculties for each writer's handwriting. The adaptation principles are of major importance for making robust decisions when neither simple lexical nor syntactic rules can be used, e.g. for a free lexicon or for full text recognition. The first part of this paper defines the concept of writer's invariants. In the second part, we explain how the recognition system can be adapted to a particular handwriting by exploiting the graphical context defined by the writer's invariants. This adaptation is guaranteed, thanks to the writer's invariants, by activating interaction links over the whole text between the recognition procedures for word entities and those for letter entities</description>
    <dc:title>Defining writer's invariants to adapt the recognition task</dc:title>

    <dc:creator>A Nosary</dc:creator>
    <dc:creator>L Heutte</dc:creator>
    <dc:creator>T Paquet</dc:creator>
    <dc:creator>Y Lecourtier</dc:creator>
    <dc:source>Document Analysis and Recognition, 1999. ICDAR '99. Proceedings of the Fifth International Conference on (1999), pp. 765-768.</dc:source>
    <dc:date>2007-12-12T13:30:46-00:00</dc:date>
    <prism:publicationYear>1999</prism:publicationYear>
    <prism:publicationName>Document Analysis and Recognition, 1999. ICDAR '99. Proceedings of the Fifth International Conference on</prism:publicationName>
    <prism:startingPage>765</prism:startingPage>
    <prism:endingPage>768</prism:endingPage>
    <prism:category>background</prism:category>
    <prism:category>codebook</prism:category>
    <prism:category>interlending</prism:category>
    <prism:category>invariants</prism:category>
    <prism:category>ocr</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/tgyork/article/1952949">
    <title>A search engine for historical manuscript images</title>
    <link>http://www.citeulike.org/user/tgyork/article/1952949</link>
    <description>&lt;i&gt;(2004), pp. 369-376.&lt;/i&gt;</description>
    <dc:title>A search engine for historical manuscript images</dc:title>

    <dc:creator>Toni Rath</dc:creator>
    <dc:creator>R Manmatha</dc:creator>
    <dc:creator>Victor Lavrenko</dc:creator>
    <dc:identifier>doi:10.1145/1008992.1009056</dc:identifier>
    <dc:source>(2004), pp. 369-376.</dc:source>
    <dc:date>2007-11-21T16:46:20-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:startingPage>369</prism:startingPage>
    <prism:endingPage>376</prism:endingPage>
    <prism:publisher>ACM</prism:publisher>
    <prism:category>features</prism:category>
    <prism:category>historical</prism:category>
    <prism:category>ocr</prism:category>
    <prism:category>search-engine</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/tgyork/article/816388">
    <title>Feature extraction methods for character recognition-A survey</title>
    <link>http://www.citeulike.org/user/tgyork/article/816388</link>
    <description>&lt;i&gt;Pattern Recognition, Vol. 29, No. 4. (April 1996), pp. 641-662.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;This paper presents an overview of feature extraction methods for off-line recognition of segmented (isolated) characters. Selection of a feature extraction method is probably the single most important factor in achieving high recognition performance in character recognition systems. Different feature extraction methods are designed for different representations of the characters, such as solid binary characters, character contours, skeletons (thinned characters) or gray-level subimages of each individual character. The feature extraction methods are discussed in terms of invariance properties, reconstructability and expected distortions and variability of the characters. The problem of choosing the appropriate feature extraction method for a given application is also discussed. When a few promising feature extraction methods have been identified, they need to be evaluated experimentally to find the best method for the given application.</description>
    <dc:title>Feature extraction methods for character recognition-A survey</dc:title>

    <dc:creator>Due</dc:creator>
    <dc:creator>Anil Jain</dc:creator>
    <dc:creator>Torfinn Taxt</dc:creator>
    <dc:identifier>doi:10.1016/0031-3203(95)00118-2</dc:identifier>
    <dc:source>Pattern Recognition, Vol. 29, No. 4. (April 1996), pp. 641-662.</dc:source>
    <dc:date>2006-08-25T07:00:22-00:00</dc:date>
    <prism:publicationYear>1996</prism:publicationYear>
    <prism:publicationName>Pattern Recognition</prism:publicationName>
    <prism:volume>29</prism:volume>
    <prism:number>4</prism:number>
    <prism:startingPage>641</prism:startingPage>
    <prism:endingPage>662</prism:endingPage>
    <prism:category>character-based</prism:category>
    <prism:category>ocr</prism:category>
    <prism:category>preprocessing</prism:category>
    <prism:category>recognition</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/tgyork/article/1724221">
    <title>Using Dynamic Time Warping for intuitive handwriting recognition</title>
    <link>http://www.citeulike.org/user/tgyork/article/1724221</link>
    <description>&lt;i&gt;&lt;/i&gt;</description>
    <dc:title>Using Dynamic Time Warping for intuitive handwriting recognition</dc:title>

    <dc:creator>R Niels</dc:creator>
    <dc:creator>L Vuurpijl</dc:creator>
    <dc:date>2007-10-03T14:05:45-00:00</dc:date>
    <prism:category>background</prism:category>
    <prism:category>ocr</prism:category>
    <prism:category>online</prism:category>
    <prism:category>project</prism:category>
</item>



</rdf:RDF>

