<?xml version="1.0" encoding="UTF-8"?>

<rdf:RDF
   xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
   xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#"
   xmlns="http://purl.org/rss/1.0/"
   xmlns:dc="http://purl.org/dc/elements/1.1/"
   xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/"
   xmlns:dcterms="http://purl.org/dc/terms/"

>
<channel rdf:about="http://www.citeulike.org/about">
<pubDate>Sat, 26 Jul 2008 04:23:31 BST</pubDate>


	<title>CiteULike: Group: automatic_summarization - library [278 articles]</title>
	<description>CiteULike: Group: automatic_summarization - library [278 articles]</description>


	<link>http://www.citeulike.org/group/114</link>
	<dc:publisher>CiteULike.org</dc:publisher>
	<dc:language>en-gb</dc:language>
	<dc:rights>Copyright &#169; 2004-2008 citeulike.org</dc:rights>
	<items>
    <rdf:Seq>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/2863680"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/1536147"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/1535958"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/385864"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/1409098"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/1408506"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/1139248"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/976721"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/977803"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/1203840"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/1203839"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/1203837"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/1203830"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/581131"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/948905"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/1128847"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/121003"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/1126813"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/1165265"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/1155415"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/1155025"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/1154930"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/1154354"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/1154351"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/965070"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/964843"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/965068"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/1151036"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/1139916"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/1139912"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/1139906"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/1139902"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/832446"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/1075713"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/1072329"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/996973"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/965072"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/984042"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/977808"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/977805"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/977802"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/911348"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/957702"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/974355"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/974063"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/973069"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/973036"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/972899"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/967062"/>
        <rdf:li rdf:resource="http://www.citeulike.org/group/114/article/961316"/>

	</rdf:Seq>
	</items>
	</channel>


<item rdf:about="http://www.citeulike.org/group/114/article/2863680">
    <title>SUMMaR: Combining Linguistics and Statistics for Text Summarization</title>
    <link>http://www.citeulike.org/group/114/article/2863680</link>
    <description>&lt;i&gt;Frontiers in Artificial Intelligence and Applications, Vol. 141 (29 August 2006), pp. 827-828.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We describe a text summarization system that moves beyond standard approaches by using a hybrid approach of linguistic and statistical analysis and by employing text-sort-specific knowledge of document structure and phrases indicating importance. The system is highly modular and entirely XML-based so that different components can be combined easily.</description>
    <dc:title>SUMMaR: Combining Linguistics and Statistics for Text Summarization</dc:title>

    <dc:creator>Manfred Stede</dc:creator>
    <dc:creator>Heike Bieler</dc:creator>
    <dc:creator>Stefanie Dipper</dc:creator>
    <dc:creator>Arthit Suriyawongkul</dc:creator>
    <dc:source>Frontiers in Artificial Intelligence and Applications, Vol. 141 (29 August 2006), pp. 827-828.</dc:source>
    <dc:date>2008-06-05T07:51:34-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Frontiers in Artificial Intelligence and Applications</prism:publicationName>
    <prism:volume>141</prism:volume>
    <prism:startingPage>827</prism:startingPage>
    <prism:endingPage>828</prism:endingPage>
    <prism:publisher>IOS Press</prism:publisher>
    <prism:category>computational-linguistics</prism:category>
    <prism:category>statistics</prism:category>
    <prism:category>summarization</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/1536147">
    <title>Learning Visual Similarity Measures for Comparing Never Seen Objects</title>
    <link>http://www.citeulike.org/group/114/article/1536147</link>
    <description>&lt;i&gt;Computer Vision and Pattern Recognition, 2007. CVPR '07. IEEE Conference on (2007), pp. 1-8.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;In this paper we propose and evaluate an algorithm that learns a similarity measure for comparing never seen objects. The measure is learned from pairs of training images labeled &#34;same&#34; or &#34;different&#34;. This is far less informative than the commonly used individual image labels (e.g. &#34;car model X&#34;), but it is cheaper to obtain. The proposed algorithm learns the characteristic differences between local descriptors sampled from pairs of &#34;same&#34; and &#34;different&#34; images. These differences are vector quantized by an ensemble of extremely randomized binary trees, and the similarity measure is computed from the quantized differences. The extremely randomized trees are fast to learn, robust due to the redundant information they carry and they have been proved to be very good clusterers. Furthermore, the trees ef ciently combine different feature types (SIFT and geometry). We evaluate our innovative similarity measure on four very different datasets and consistantly outperform the state-of-the-art competitive approaches.</description>
    <dc:title>Learning Visual Similarity Measures for Comparing Never Seen Objects</dc:title>

    <dc:creator>Eric Nowak</dc:creator>
    <dc:creator>Frederic Jurie</dc:creator>
    <dc:source>Computer Vision and Pattern Recognition, 2007. CVPR '07. IEEE Conference on (2007), pp. 1-8.</dc:source>
    <dc:date>2007-08-05T08:24:59-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:publicationName>Computer Vision and Pattern Recognition, 2007. CVPR '07. IEEE Conference on</prism:publicationName>
    <prism:startingPage>1</prism:startingPage>
    <prism:endingPage>8</prism:endingPage>
    <prism:category>2007</prism:category>
    <prism:category>category-recognition</prism:category>
    <prism:category>cvpr</prism:category>
    <prism:category>metric-learning</prism:category>
    <prism:category>object-categorization</prism:category>
    <prism:category>object-recognition</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/1535958">
    <title>Proximity Distribution Kernels for Geometric Context in Category Recognition</title>
    <link>http://www.citeulike.org/group/114/article/1535958</link>
    <description>&lt;i&gt;(October 2007)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We propose using the proximity distribution of vector quantized local feature descriptors for object and category recognition. To this end, we introduce a novel “proximity distribution kernel” that naturally combines local geometric as well as photometric information from images. It satisfies Mercer’s condition and can therefore be readily combined with a support vector machine to perform visual categorization in a way that is insensitive to photometric and geometric variations, while retaining significant discriminative power. In particular, it improves on the results obtained both with geometrically un-constrained “bags of features” approaches, as well as with over-constrained “affine procrustes.” Indeed, we test this approach on several challenging data sets, including Graz-01, Graz-02, and the PASCAL challenge, and in all tests it outperforms all previously proposed approaches. We registered the average performance at 91.5% on Graz-01, 82.7% on Graz-02, and 74.5% on PASCAL. Our approach is designed to enforce and exploit geometric consistency among objects in the same category; therefore, it does not improve the performance of existing algorithms on datasets where the data is already roughly aligned and scaled. Our method has the potential to be extended to more complex geometric relationships among local features, as we illustrate in the experiments.</description>
    <dc:title>Proximity Distribution Kernels for Geometric Context in Category Recognition</dc:title>

    <dc:creator>Haibin Ling</dc:creator>
    <dc:creator>Stefano Soato</dc:creator>
    <dc:source>(October 2007)</dc:source>
    <dc:date>2007-08-05T05:53:51-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:category>2007</prism:category>
    <prism:category>category-recognition</prism:category>
    <prism:category>iccv</prism:category>
    <prism:category>object-categorization</prism:category>
    <prism:category>object-recognition</prism:category>
    <prism:category>spatial-pyramid-matching</prism:category>
    <prism:category>spatial-relationship</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/385864">
    <title>Learning distance functions for image retrieval</title>
    <link>http://www.citeulike.org/group/114/article/385864</link>
    <description>&lt;i&gt;Computer Vision and Pattern Recognition, 2004. CVPR 2004. Proceedings of the 2004 IEEE Computer Society Conference on, Vol. 2 (2004), pp. II-570-II-577 Vol.2.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Image retrieval critically relies on the distance function used to compare a query image to images in the database. We suggest learning such distance functions by training binary classifiers with margins, where the classifiers are defined over the product space of pairs of images. The classifiers are trained to distinguish between pairs in which the images are from the same class and pairs, which contain images from different classes. The signed margin is used as a distance function. We explore several variants of this idea, based on using SVM and boosting algorithms as product space classifiers. Our main contribution is a distance learning method, which combines boosting hypotheses over the product space with a weak learner based on partitioning the original feature space. The weak learner used is a Gaussian mixture model computed using a constrained EM algorithm, where the constraints are equivalence constraints on pairs of data points. This approach allows us to incorporate unlabeled data into the training process. Using some benchmark databases from the UCI repository, we show that our margin based methods significantly outperform existing metric learning methods, which are based an learning a Mahalanobis distance. We then show comparative results of image retrieval in a distributed learning paradigm, using two databases: a large database of facial images (YaleB), and a database of natural images taken from a commercial CD. In both cases our GMM based boosting method outperforms all other methods, and its generalization to unseen classes is superior.</description>
    <dc:title>Learning distance functions for image retrieval</dc:title>

    <dc:creator>T Hertz</dc:creator>
    <dc:creator>A Bar-Hillel</dc:creator>
    <dc:creator>D Weinshall</dc:creator>
    <dc:source>Computer Vision and Pattern Recognition, 2004. CVPR 2004. Proceedings of the 2004 IEEE Computer Society Conference on, Vol. 2 (2004), pp. II-570-II-577 Vol.2.</dc:source>
    <dc:date>2005-11-09T18:14:24-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:publicationName>Computer Vision and Pattern Recognition, 2004. CVPR 2004. Proceedings of the 2004 IEEE Computer Society Conference on</prism:publicationName>
    <prism:volume>2</prism:volume>
    <prism:startingPage>II-570</prism:startingPage>
    <prism:endingPage>II-577 Vol.2</prism:endingPage>
    <prism:category>learning</prism:category>
    <prism:category>metric-learning</prism:category>
    <prism:category>toread</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/1409098">
    <title>On learning asymmetric dissimilarity measures</title>
    <link>http://www.citeulike.org/group/114/article/1409098</link>
    <description>&lt;i&gt;Data Mining, Fifth IEEE International Conference on (2005), 4 pp..&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Many practical applications require that distance measures to be asymmetric and context-sensitive. We introduce context-sensitive learnable asymmetric dissimilarity (CLAD) measures, which are defined to be a weighted sum of a fixed number of dissimilarity measures where the associated weights depend on the point from which the dissimilarity is measured. The parameters used in defining the measure capture the global relationships among the features. We provide an algorithm to learn the dissimilarity measure automatically from a set of user specified comparisons in the form &#34;x is closer to y than to z&#34; and study its performance. The experimental results show that the proposed algorithm outperforms other approaches due to the context sensitive nature of the CLAD measures.</description>
    <dc:title>On learning asymmetric dissimilarity measures</dc:title>

    <dc:creator>K Kummamuru</dc:creator>
    <dc:creator>R Krishnapuram</dc:creator>
    <dc:creator>R Agrawal</dc:creator>
    <dc:source>Data Mining, Fifth IEEE International Conference on (2005), 4 pp..</dc:source>
    <dc:date>2007-06-24T13:09:22-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Data Mining, Fifth IEEE International Conference on</prism:publicationName>
    <prism:startingPage>4 pp.</prism:startingPage>
    <prism:category>learning</prism:category>
    <prism:category>metric-learning</prism:category>
    <prism:category>toread</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/1408506">
    <title>Dynamic visual attention model in image sequences</title>
    <link>http://www.citeulike.org/group/114/article/1408506</link>
    <description>&lt;i&gt;Image Vision Comput., Vol. 25, No. 5. (May 2007), pp. 597-613.&lt;/i&gt;</description>
    <dc:title>Dynamic visual attention model in image sequences</dc:title>

    <dc:creator>Mar&#38;\#237;a L&#38;\#243;pez</dc:creator>
    <dc:creator>Miguel Fern&#38;\#225;ndez</dc:creator>
    <dc:creator>Antonio Fern&#38;\#225;ndez-Caballero</dc:creator>
    <dc:creator>Jos&#38;\#233; Mira</dc:creator>
    <dc:creator>Ana Delgado</dc:creator>
    <dc:identifier>doi:10.1016/j.imavis.2006.05.004</dc:identifier>
    <dc:source>Image Vision Comput., Vol. 25, No. 5. (May 2007), pp. 597-613.</dc:source>
    <dc:date>2007-06-24T01:58:40-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:publicationName>Image Vision Comput.</prism:publicationName>
    <prism:issn>0262-8856</prism:issn>
    <prism:volume>25</prism:volume>
    <prism:number>5</prism:number>
    <prism:startingPage>597</prism:startingPage>
    <prism:endingPage>613</prism:endingPage>
    <prism:publisher>Butterworth-Heinemann</prism:publisher>
    <prism:category>attention</prism:category>
    <prism:category>survey</prism:category>
    <prism:category>video_attention</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/1139248">
    <title>Text Classification from Labeled and Unlabeled Documents using EM</title>
    <link>http://www.citeulike.org/group/114/article/1139248</link>
    <description>&lt;i&gt;Machine Learning, Vol. V39, No. 2. (1 May 2000), pp. 103-134.&lt;/i&gt;</description>
    <dc:title>Text Classification from Labeled and Unlabeled Documents using EM</dc:title>

    <dc:creator>Kamal Nigam</dc:creator>
    <dc:creator>Andrew Mccallum</dc:creator>
    <dc:creator>Sebastian Thrun</dc:creator>
    <dc:creator>Tom Mitchell</dc:creator>
    <dc:identifier>doi:10.1023/A:1007692713085</dc:identifier>
    <dc:source>Machine Learning, Vol. V39, No. 2. (1 May 2000), pp. 103-134.</dc:source>
    <dc:date>2007-03-04T04:25:56-00:00</dc:date>
    <prism:publicationYear>2000</prism:publicationYear>
    <prism:publicationName>Machine Learning</prism:publicationName>
    <prism:volume>V39</prism:volume>
    <prism:number>2</prism:number>
    <prism:startingPage>103</prism:startingPage>
    <prism:endingPage>134</prism:endingPage>
    <prism:category>em</prism:category>
    <prism:category>semi-supervised</prism:category>
    <prism:category>semi-supervised-learning</prism:category>
    <prism:category>text-classification</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/976721">
    <title>Bayesian Sets</title>
    <link>http://www.citeulike.org/group/114/article/976721</link>
    <description>&lt;i&gt;(2005)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Inspired by &#34;Google Sets&#34;, we consider the problem of retrieving items from a concept or cluster, given a query consisting of a few items from that cluster. We formulate this as a Bayesian inference problem and describe a very simple algorithm for solving it. Our algorithm uses a modelbased concept of a cluster and ranks items using a score which evaluates the marginal probability that each item belongs to a cluster containing the query items. For exponential family models with...</description>
    <dc:title>Bayesian Sets</dc:title>

    <dc:creator>Z Ghahramani</dc:creator>
    <dc:creator>KA Heller</dc:creator>
    <dc:source>(2005)</dc:source>
    <dc:date>2006-12-06T13:41:10-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:category>bayesian</prism:category>
    <prism:category>graphical-model</prism:category>
    <prism:category>learning</prism:category>
    <prism:category>statistical-model</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/977803">
    <title>A Simple Bayesian Framework for Content-Based Image Retrieval</title>
    <link>http://www.citeulike.org/group/114/article/977803</link>
    <description>&lt;i&gt;(2006), pp. 2110-2117.&lt;/i&gt;</description>
    <dc:title>A Simple Bayesian Framework for Content-Based Image Retrieval</dc:title>

    <dc:creator>Katherine Heller</dc:creator>
    <dc:creator>Zoubin Ghahramani</dc:creator>
    <dc:identifier>doi:10.1109/CVPR.2006.41</dc:identifier>
    <dc:source>(2006), pp. 2110-2117.</dc:source>
    <dc:date>2006-12-07T12:31:00-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:startingPage>2110</prism:startingPage>
    <prism:endingPage>2117</prism:endingPage>
    <prism:publisher>IEEE Computer Society</prism:publisher>
    <prism:category>bayesian</prism:category>
    <prism:category>graphical-model</prism:category>
    <prism:category>learning</prism:category>
    <prism:category>photo2search</prism:category>
    <prism:category>retrieval</prism:category>
    <prism:category>statistical-model</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/1203840">
    <title>Learning to Locate Informative Features for Visual Identification</title>
    <link>http://www.citeulike.org/group/114/article/1203840</link>
    <description>&lt;i&gt;International Journal of Computer Vision (2006)&lt;/i&gt;</description>
    <dc:title>Learning to Locate Informative Features for Visual Identification</dc:title>

    <dc:creator>Andras Ferencz</dc:creator>
    <dc:creator>Erik Learned-Miller</dc:creator>
    <dc:creator>Jitendra Malik</dc:creator>
    <dc:source>International Journal of Computer Vision (2006)</dc:source>
    <dc:date>2007-04-03T08:25:51-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>International Journal of Computer Vision</prism:publicationName>
    <prism:category>bag-of-features</prism:category>
    <prism:category>object-categorization</prism:category>
    <prism:category>object-recognition</prism:category>
    <prism:category>photo2search</prism:category>
    <prism:category>reading</prism:category>
    <prism:category>recognition</prism:category>
    <prism:category>segmentation</prism:category>
    <prism:category>spatial-relationship</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/1203839">
    <title>Discriminative Training of Hyper-feature Models for Object Identification</title>
    <link>http://www.citeulike.org/group/114/article/1203839</link>
    <description>&lt;i&gt;(2006)&lt;/i&gt;</description>
    <dc:title>Discriminative Training of Hyper-feature Models for Object Identification</dc:title>

    <dc:creator>Vidit Jain</dc:creator>
    <dc:creator>Andras Ferencz</dc:creator>
    <dc:creator>Erik Learned-Miller</dc:creator>
    <dc:source>(2006)</dc:source>
    <dc:date>2007-04-03T08:24:34-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:category>bag-of-features</prism:category>
    <prism:category>object-categorization</prism:category>
    <prism:category>object-recognition</prism:category>
    <prism:category>photo2search</prism:category>
    <prism:category>reading</prism:category>
    <prism:category>recognition</prism:category>
    <prism:category>segmentation</prism:category>
    <prism:category>spatial-relationship</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/1203837">
    <title>Learning Hyper-Features for Visual Identification</title>
    <link>http://www.citeulike.org/group/114/article/1203837</link>
    <description>&lt;i&gt;Vol. 18 (2004)&lt;/i&gt;</description>
    <dc:title>Learning Hyper-Features for Visual Identification</dc:title>

    <dc:creator>Andras Ferencz</dc:creator>
    <dc:creator>Erik Learned-Miller</dc:creator>
    <dc:creator>Jitendra Malik</dc:creator>
    <dc:source>Vol. 18 (2004)</dc:source>
    <dc:date>2007-04-03T08:20:33-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:volume>18</prism:volume>
    <prism:category>bag-of-features</prism:category>
    <prism:category>object-categorization</prism:category>
    <prism:category>object-recognition</prism:category>
    <prism:category>photo2search</prism:category>
    <prism:category>reading</prism:category>
    <prism:category>recognition</prism:category>
    <prism:category>segmentation</prism:category>
    <prism:category>spatial-relationship</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/1203830">
    <title>Building a classification cascade for visual identification from one example</title>
    <link>http://www.citeulike.org/group/114/article/1203830</link>
    <description>&lt;i&gt;Computer Vision, 2005. ICCV 2005. Tenth IEEE International Conference on, Vol. 1 (2005), pp. 286-293 Vol. 1.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Object identification (OID) is specialized recognition where the category is known (e.g. cars) and the algorithm recognizes an object's exact identity (e.g. Bob's BMW). Two special challenges characterize OID. (1) Interclass variation is often small (many cars look alike) and may be dwarfed by illumination or pose changes. (2) There may be many classes but few or just one positive &#34;training&#34; examples per class. Due to (1), a solution must locate possibly subtle object-specific salient features (a door handle) while avoiding distracting ones (a specular highlight). However, (2) rules out direct techniques of feature selection. We describe an online algorithm that takes one model image from a known category and builds an efficient &#34;same&#34; vs. &#34;different&#34; classification cascade by predicting the most discriminative feature set for that object. Our method not only estimates the saliency and scoring function for each candidate feature, but also models the dependency between features, building an ordered feature sequence unique to a specific model image, maximizing cumulative information content. Learned stopping thresholds make the classifier very efficient. To make this possible, category-specific characteristics are learned automatically in an off-line training procedure from labeled image pairs of the category, without prior knowledge about the category. Our method, using the same algorithm for both cars and faces, outperforms a wide variety of other methods.</description>
    <dc:title>Building a classification cascade for visual identification from one example</dc:title>

    <dc:creator>A Ferencz</dc:creator>
    <dc:creator>EG Learned-Miller</dc:creator>
    <dc:creator>J Malik</dc:creator>
    <dc:source>Computer Vision, 2005. ICCV 2005. Tenth IEEE International Conference on, Vol. 1 (2005), pp. 286-293 Vol. 1.</dc:source>
    <dc:date>2007-04-03T08:12:27-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Computer Vision, 2005. ICCV 2005. Tenth IEEE International Conference on</prism:publicationName>
    <prism:volume>1</prism:volume>
    <prism:startingPage>286</prism:startingPage>
    <prism:endingPage>293 Vol. 1</prism:endingPage>
    <prism:category>bag-of-features</prism:category>
    <prism:category>object-categorization</prism:category>
    <prism:category>object-identification</prism:category>
    <prism:category>object-recognition</prism:category>
    <prism:category>photo2search</prism:category>
    <prism:category>reading</prism:category>
    <prism:category>recognition</prism:category>
    <prism:category>spatial-relationship</prism:category>
    <prism:category>statistical-model</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/581131">
    <title>Hyperfeatures - Multilevel Local Coding for Visual Recognition</title>
    <link>http://www.citeulike.org/group/114/article/581131</link>
    <description>&lt;i&gt;(2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Histograms of local appearance descriptors are a popular representation for visual recognition. They are highly discriminant and they have good resistance to local occlusions and to geometric and photometric variations, but they are not able to exploit spatial co-occurrence statistics of features at scales larger than their local input patches. We present a new multilevel visual representation, `hyperfeatures', that is designed to remedy this. The basis of the work is the familiar notion that to detect object parts, in practice it often suffices to detect co-occurrences of more local object fragments – a process that can be formalized as comparison (vector quantization) of image patches against a codebook of known fragments, followed by local aggregation of the resulting codebook membership vectors to detect co-occurrences. This process converts collections of local image descriptor vectors into slightly less local histogram vectors – higher-level but spatially coarser descriptors. Our central observation is that it can therefore be iterated, and that doing so captures and codes ever larger assemblies of object parts and increasingly abstract or `semantic' image properties. This repeated nonlinear `folding' is essentially different from that of hierarchical models such as Convolutional Neural Networks and HMAX, being based on repeated comparison to local prototypes and accumulation of co-occurrence statistics rather than on repeated convolution and rectification. We formulate the hyperfeatures model and study its performance under several different image coding methods including clustering based Vector Quantization, Gaussian Mixtures, and combinations of these with Latent Discriminant Analysis. We find that the resulting high-level features provide improved performance in several object image and texture image classification tasks.</description>
    <dc:title>Hyperfeatures - Multilevel Local Coding for Visual Recognition</dc:title>

    <dc:creator>Ankur Agarwal</dc:creator>
    <dc:creator>William Triggs</dc:creator>
    <dc:source>(2006)</dc:source>
    <dc:date>2006-04-10T15:37:34-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:category>bag-of-features</prism:category>
    <prism:category>hyperfeature</prism:category>
    <prism:category>object-categorization</prism:category>
    <prism:category>object-recognition</prism:category>
    <prism:category>photo2search</prism:category>
    <prism:category>reading</prism:category>
    <prism:category>recognition</prism:category>
    <prism:category>spatial-relationship</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/948905">
    <title>Using Multiple Segmentations to Discover Objects and their Extent in Image Collections</title>
    <link>http://www.citeulike.org/group/114/article/948905</link>
    <description>&lt;i&gt;(2006)&lt;/i&gt;</description>
    <dc:title>Using Multiple Segmentations to Discover Objects and their Extent in Image Collections</dc:title>

    <dc:creator>BC Russell</dc:creator>
    <dc:creator>AA Efros</dc:creator>
    <dc:creator>J Sivic</dc:creator>
    <dc:creator>WT Freeman</dc:creator>
    <dc:creator>A Zisserman</dc:creator>
    <dc:source>(2006)</dc:source>
    <dc:date>2006-11-16T14:33:58-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:category>bag-of-features</prism:category>
    <prism:category>object-categorization</prism:category>
    <prism:category>object-recognition</prism:category>
    <prism:category>photo2search</prism:category>
    <prism:category>reading</prism:category>
    <prism:category>recognition</prism:category>
    <prism:category>segmentation</prism:category>
    <prism:category>spatial-relationship</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/1128847">
    <title>Pictorial Structures for Object Recognition</title>
    <link>http://www.citeulike.org/group/114/article/1128847</link>
    <description>&lt;i&gt;International Journal of Computer Vision, Vol. V61, No. 1. (1 January 2005), pp. 55-79.&lt;/i&gt;</description>
    <dc:title>Pictorial Structures for Object Recognition</dc:title>

    <dc:creator>Pedro Felzenszwalb</dc:creator>
    <dc:creator>Daniel Huttenlocher</dc:creator>
    <dc:identifier>doi:10.1023/B:VISI.0000042934.15159.49</dc:identifier>
    <dc:source>International Journal of Computer Vision, Vol. V61, No. 1. (1 January 2005), pp. 55-79.</dc:source>
    <dc:date>2007-02-28T06:10:54-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>International Journal of Computer Vision</prism:publicationName>
    <prism:volume>V61</prism:volume>
    <prism:number>1</prism:number>
    <prism:startingPage>55</prism:startingPage>
    <prism:endingPage>79</prism:endingPage>
    <prism:category>bag-of-feature</prism:category>
    <prism:category>object-categorization</prism:category>
    <prism:category>object-recognition</prism:category>
    <prism:category>photo2search</prism:category>
    <prism:category>recognition</prism:category>
    <prism:category>spatial-relationship</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/121003">
    <title>Unbalanced region matching based on two-level description for image retrieval</title>
    <link>http://www.citeulike.org/group/114/article/121003</link>
    <description>&lt;i&gt;Pattern Recognition Letters, Vol. 26, No. 5. (April 2005), pp. 565-580.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Research on integrating spatial information into content-based image retrieval (CBIR) is aimed at solving the problem caused by global feature based algorithm. Most systems derive the spatial information from image segmentation. However, the description of images based on one-level segmentation (OLD) and the inevitable inaccuracy of segmentation results seriously limit the performance. A two-level description (TLD) describes images by a rough description and a detailed description to avoid improper spatial constraint caused by OLD is proposed. Similarity measurement based on unbalanced region matching (URM) is introduced to take advantage of TLD to reduce the influence of segmentation. A novel spatial descriptor integrating shape, size, and density as well as position and spatial layout information together is also proposed. The performance of the integrated system is illustrated by experimental results with 1000 query images randomly selected from a database of 10,000 general-purpose images.</description>
    <dc:title>Unbalanced region matching based on two-level description for image retrieval</dc:title>

    <dc:creator>Sheng-Yang Dai</dc:creator>
    <dc:creator>Yu-Jin Zhang</dc:creator>
    <dc:identifier>doi:10.1016/j.patrec.2004.08.022</dc:identifier>
    <dc:source>Pattern Recognition Letters, Vol. 26, No. 5. (April 2005), pp. 565-580.</dc:source>
    <dc:date>2005-03-11T09:34:09-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Pattern Recognition Letters</prism:publicationName>
    <prism:volume>26</prism:volume>
    <prism:number>5</prism:number>
    <prism:startingPage>565</prism:startingPage>
    <prism:endingPage>580</prism:endingPage>
    <prism:category>object-categorization</prism:category>
    <prism:category>object-recognition</prism:category>
    <prism:category>photo2search</prism:category>
    <prism:category>recognition</prism:category>
    <prism:category>spatial-relationship</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/1126813">
    <title>Object class recognition by unsupervised scale-invariant learning</title>
    <link>http://www.citeulike.org/group/114/article/1126813</link>
    <description>&lt;i&gt;Computer Vision and Pattern Recognition, 2003. Proceedings. 2003 IEEE Computer Society Conference on, Vol. 2 (2003), pp. II-264-II-271 vol.2.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We present a method to learn and recognize object class models from unlabeled and unsegmented cluttered scenes in a scale invariant manner. Objects are modeled as flexible constellations of parts. A probabilistic representation is used for all aspects of the object: shape, appearance, occlusion and relative scale. An entropy-based feature detector is used to select regions and their scale within the image. In learning the parameters of the scale-invariant object model are estimated. This is done using expectation-maximization in a maximum-likelihood setting. In recognition, this model is used in a Bayesian manner to classify images. The flexible nature of the model is demonstrated by excellent results over a range of datasets including geometrically constrained classes (e.g. faces, cars) and flexible objects (such as animals).</description>
    <dc:title>Object class recognition by unsupervised scale-invariant learning</dc:title>

    <dc:creator>R Fergus</dc:creator>
    <dc:creator>P Perona</dc:creator>
    <dc:creator>A Zisserman</dc:creator>
    <dc:source>Computer Vision and Pattern Recognition, 2003. Proceedings. 2003 IEEE Computer Society Conference on, Vol. 2 (2003), pp. II-264-II-271 vol.2.</dc:source>
    <dc:date>2007-02-27T10:24:47-00:00</dc:date>
    <prism:publicationYear>2003</prism:publicationYear>
    <prism:publicationName>Computer Vision and Pattern Recognition, 2003. Proceedings. 2003 IEEE Computer Society Conference on</prism:publicationName>
    <prism:volume>2</prism:volume>
    <prism:startingPage>II-264</prism:startingPage>
    <prism:endingPage>II-271 vol.2</prism:endingPage>
    <prism:category>object-categorization</prism:category>
    <prism:category>object-recognition</prism:category>
    <prism:category>photo2search</prism:category>
    <prism:category>reading</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/1165265">
    <title>Learning Saliency Maps for Object Categorization</title>
    <link>http://www.citeulike.org/group/114/article/1165265</link>
    <description>&lt;i&gt;(2006)&lt;/i&gt;</description>
    <dc:title>Learning Saliency Maps for Object Categorization</dc:title>

    <dc:creator>Frank Moosmann</dc:creator>
    <dc:creator>Diane Larlus</dc:creator>
    <dc:creator>Frederic Jurie</dc:creator>
    <dc:source>(2006)</dc:source>
    <dc:date>2007-03-15T10:16:03-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:category>attention</prism:category>
    <prism:category>bag-of-feature</prism:category>
    <prism:category>object-categorization</prism:category>
    <prism:category>object-recognition</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/1155415">
    <title>Object modeling and recognition using local affine-invariant image descriptors and multi-view spatial contraints</title>
    <link>http://www.citeulike.org/group/114/article/1155415</link>
    <description>&lt;i&gt;International Journal of Computer Vision, Vol. 66, No. 3. (2006)&lt;/i&gt;</description>
    <dc:title>Object modeling and recognition using local affine-invariant image descriptors and multi-view spatial contraints</dc:title>

    <dc:creator>F Rothganger</dc:creator>
    <dc:creator>Svetlana Lazebnik</dc:creator>
    <dc:creator>Cordelia Schmid</dc:creator>
    <dc:creator>Jean Ponce</dc:creator>
    <dc:source>International Journal of Computer Vision, Vol. 66, No. 3. (2006)</dc:source>
    <dc:date>2007-03-12T13:44:47-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>International Journal of Computer Vision</prism:publicationName>
    <prism:volume>66</prism:volume>
    <prism:number>3</prism:number>
    <prism:category>bag-of-feature</prism:category>
    <prism:category>object-categorization</prism:category>
    <prism:category>object-recognition</prism:category>
    <prism:category>photo2search</prism:category>
    <prism:category>spatial-relationship</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/1155025">
    <title>On-Line Construction of Compact Directed Acyclic Word Graphs</title>
    <link>http://www.citeulike.org/group/114/article/1155025</link>
    <description>&lt;i&gt;Lecture Notes in Computer Science, Vol. 2089 (2001)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Directed Acyclic Word Graph (DAWG) is a space efficient data structure that supports indices of a string. Compact Directed Acyclic Word Graph (CDAWG) is a more space efficient variant of DAWG. Crochemore and Verin gave the first direct algorithm to construct CDAWGs from given strings, based on the McCreight's algorithm for suffix trees. In this paper, we give an Ukkonen's counterpart for CDAWGs. That is, we show an on-line algorithm that constructs CDAWGs from given strings directly.</description>
    <dc:title>On-Line Construction of Compact Directed Acyclic Word Graphs</dc:title>

    <dc:creator>Shunsuke Inenaga</dc:creator>
    <dc:creator>Hiromasa Hoshino</dc:creator>
    <dc:creator>Ayumi Shinohara</dc:creator>
    <dc:creator>Masayuki Takeda</dc:creator>
    <dc:creator>Setsuo Arikawa</dc:creator>
    <dc:creator>Giancarlo Mauri</dc:creator>
    <dc:creator>Giulio Pavesi</dc:creator>
    <dc:source>Lecture Notes in Computer Science, Vol. 2089 (2001)</dc:source>
    <dc:date>2007-03-12T07:17:04-00:00</dc:date>
    <prism:publicationYear>2001</prism:publicationYear>
    <prism:publicationName>Lecture Notes in Computer Science</prism:publicationName>
    <prism:volume>2089</prism:volume>
    <prism:category>compact</prism:category>
    <prism:category>dawg</prism:category>
    <prism:category>trie</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/1154930">
    <title>Fast Practical Multi-Pattern Matching</title>
    <link>http://www.citeulike.org/group/114/article/1154930</link>
    <description>&lt;i&gt;Information Processing Letters, Vol. 71, No. 3-4. (1999), pp. 107-113.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;The main result of the paper is the construction of a very fast multi-pattern matching algorithm, called DAWG-MATCH. The algorithm is of Boyer-Moore type. Previous algorithm of this type is the Commentz-Walter algorithm. The DAWG-MATCH algorithm behaves better than Commentz-Walter algorithm. We combine the ideas of two algorithms: the Aho-Corasick algorithm, and the Reverse Factor algorithm from Crochemore et alii. The new algorithm performs at most 2jtextj inspections of text characters, and...</description>
    <dc:title>Fast Practical Multi-Pattern Matching</dc:title>

    <dc:creator>Maxime Crochemore</dc:creator>
    <dc:creator>Artur Czumaj</dc:creator>
    <dc:creator>Leszek Gasieniec</dc:creator>
    <dc:creator>Thierry Lecroq</dc:creator>
    <dc:creator>Wojciech Plandowski</dc:creator>
    <dc:creator>Wojciech Rytter</dc:creator>
    <dc:source>Information Processing Letters, Vol. 71, No. 3-4. (1999), pp. 107-113.</dc:source>
    <dc:date>2007-03-12T06:15:04-00:00</dc:date>
    <prism:publicationYear>1999</prism:publicationYear>
    <prism:publicationName>Information Processing Letters</prism:publicationName>
    <prism:volume>71</prism:volume>
    <prism:number>3-4</prism:number>
    <prism:startingPage>107</prism:startingPage>
    <prism:endingPage>113</prism:endingPage>
    <prism:category>dawg</prism:category>
    <prism:category>matching</prism:category>
    <prism:category>pattern-matching</prism:category>
    <prism:category>string-matching</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/1154354">
    <title>Fast text searching for regular expressions or automaton searching on tries</title>
    <link>http://www.citeulike.org/group/114/article/1154354</link>
    <description>&lt;i&gt;Journal of the ACM, Vol. 43, No. 6. (1996), pp. 915-936.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We present algorithms for efficient searching of regular expressions on preprocessed text, using a Patricia tree as a logical model for the index. We obtain searching algorithms which run in logarithmic expected time in the size of the text for a wide subclass of regular expressions, and in sublinear expected time for any regular expression. This is the first such algorithm to be found with this complexity. 1 Introduction Pattern matching and text searching are very important components of...</description>
    <dc:title>Fast text searching for regular expressions or automaton searching on tries</dc:title>

    <dc:creator>Richardo</dc:creator>
    <dc:creator>Gaston Gonnet</dc:creator>
    <dc:source>Journal of the ACM, Vol. 43, No. 6. (1996), pp. 915-936.</dc:source>
    <dc:date>2007-03-11T19:34:51-00:00</dc:date>
    <prism:publicationYear>1996</prism:publicationYear>
    <prism:publicationName>Journal of the ACM</prism:publicationName>
    <prism:volume>43</prism:volume>
    <prism:number>6</prism:number>
    <prism:startingPage>915</prism:startingPage>
    <prism:endingPage>936</prism:endingPage>
    <prism:category>matching</prism:category>
    <prism:category>regular-expression</prism:category>
    <prism:category>search</prism:category>
    <prism:category>string</prism:category>
    <prism:category>text</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/1154351">
    <title>Multiple Pattern Matching in LZW Compressed Text</title>
    <link>http://www.citeulike.org/group/114/article/1154351</link>
    <description>&lt;i&gt;(1998), pp. 103-112.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;In this paper we address the problem of searching in LZW compressed text directly, and present a new algorithm for finding multiple patterns bysimulating the moveofthe Aho-Corasick pattern matching machine. The new algorithm finds all occurrences of multiple patterns whereas the algorithm proposed by Amir, Benson, and Farach finds only the first occurrence of a single pattern.</description>
    <dc:title>Multiple Pattern Matching in LZW Compressed Text</dc:title>

    <dc:creator>Takuya Kida</dc:creator>
    <dc:creator>Masayuki Takeda</dc:creator>
    <dc:creator>Ayumi Shinohara</dc:creator>
    <dc:creator>Masamichi Miyazaki</dc:creator>
    <dc:creator>Setsuo Arikawa</dc:creator>
    <dc:source>(1998), pp. 103-112.</dc:source>
    <dc:date>2007-03-11T19:25:34-00:00</dc:date>
    <prism:publicationYear>1998</prism:publicationYear>
    <prism:startingPage>103</prism:startingPage>
    <prism:endingPage>112</prism:endingPage>
    <prism:category>lzw</prism:category>
    <prism:category>matching</prism:category>
    <prism:category>pattern</prism:category>
    <prism:category>search</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/965070">
    <title>Shape matching and object recognition using low distortion correspondences</title>
    <link>http://www.citeulike.org/group/114/article/965070</link>
    <description>&lt;i&gt;Computer Vision and Pattern Recognition, 2005. CVPR 2005. IEEE Computer Society Conference on, Vol. 1 (2005), pp. 26-33 vol. 1.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We approach recognition in the framework of deformable shape matching, relying on a new algorithm for finding correspondences between feature points. This algorithm sets up correspondence as an integer quadratic programming problem, where the cost function has terms based on similarity of corresponding geometric blur point descriptors as well as the geometric distortion between pairs of corresponding feature points. The algorithm handles outliers, and thus enables matching of exemplars to query images in the presence of occlusion and clutter. Given the correspondences, we estimate an aligning transform, typically a regularized thin plate spline, resulting in a dense correspondence between the two shapes. Object recognition is then handled in a nearest neighbor framework where the distance between exemplar and query is the matching cost between corresponding points. We show results on two datasets. One is the Caltech 101 dataset (Fei-Fei, Fergus and Perona), an extremely challenging dataset with large intraclass variation. Our approach yields a 48% correct classification rate, compared to Fei-Fei et al 's 16%. We also show results for localizing frontal and profile faces that are comparable to special purpose approaches tuned to faces.</description>
    <dc:title>Shape matching and object recognition using low distortion correspondences</dc:title>

    <dc:creator>AC Berg</dc:creator>
    <dc:creator>TL Berg</dc:creator>
    <dc:creator>J Malik</dc:creator>
    <dc:source>Computer Vision and Pattern Recognition, 2005. CVPR 2005. IEEE Computer Society Conference on, Vol. 1 (2005), pp. 26-33 vol. 1.</dc:source>
    <dc:date>2006-11-28T09:36:00-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Computer Vision and Pattern Recognition, 2005. CVPR 2005. IEEE Computer Society Conference on</prism:publicationName>
    <prism:volume>1</prism:volume>
    <prism:startingPage>26</prism:startingPage>
    <prism:endingPage>33 vol. 1</prism:endingPage>
    <prism:category>bag-of-features</prism:category>
    <prism:category>object-categorization</prism:category>
    <prism:category>object-recognition</prism:category>
    <prism:category>photo2search</prism:category>
    <prism:category>reading</prism:category>
    <prism:category>spatial-relationship</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/964843">
    <title>Local Features for Object Class Recognition</title>
    <link>http://www.citeulike.org/group/114/article/964843</link>
    <description>&lt;i&gt;(2005), pp. 1792-1799.&lt;/i&gt;</description>
    <dc:title>Local Features for Object Class Recognition</dc:title>

    <dc:creator>Krystian Mikolajczyk</dc:creator>
    <dc:creator>Bastian Leibe</dc:creator>
    <dc:creator>Bernt Schiele</dc:creator>
    <dc:identifier>doi:10.1109/ICCV.2005.146</dc:identifier>
    <dc:source>(2005), pp. 1792-1799.</dc:source>
    <dc:date>2006-11-28T06:57:43-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:startingPage>1792</prism:startingPage>
    <prism:endingPage>1799</prism:endingPage>
    <prism:publisher>IEEE Computer Society</prism:publisher>
    <prism:category>bag-of-features</prism:category>
    <prism:category>object-categorization</prism:category>
    <prism:category>object-recognition</prism:category>
    <prism:category>photo2search</prism:category>
    <prism:category>reading</prism:category>
    <prism:category>spatial-relationship</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/965068">
    <title>Multiclass Object Recognition with Sparse, Localized Features</title>
    <link>http://www.citeulike.org/group/114/article/965068</link>
    <description>&lt;i&gt;Computer Vision and Pattern Recognition, 2006 IEEE Computer Society Conference on, Vol. 1 (2006), pp. 11-18.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We apply a biologically inspired model of visual object recognition to the multiclass object categorization problem. Our model modifies that of Serre, Wolf, and Poggio. As in that work, we first apply Gabor filters at all positions and scales; feature complexity and position/scale invariance are then built up by alternating template matching and max pooling operations. We refine the approach in several biologically plausible ways, using simple versions of sparsification and lateral inhibition. We demonstrate the value of retaining some position and scale information above the intermediate feature level. Using feature selection we arrive at a model that performs better with fewer features. Our final model is tested on the Caltech 101 object categories and the UIUC car localization task, in both cases achieving state-of-the-art performance. The results strengthen the case for using this class of model in computer vision.</description>
    <dc:title>Multiclass Object Recognition with Sparse, Localized Features</dc:title>

    <dc:creator>J Mutch</dc:creator>
    <dc:creator>DG Lowe</dc:creator>
    <dc:source>Computer Vision and Pattern Recognition, 2006 IEEE Computer Society Conference on, Vol. 1 (2006), pp. 11-18.</dc:source>
    <dc:date>2006-11-28T09:34:06-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Computer Vision and Pattern Recognition, 2006 IEEE Computer Society Conference on</prism:publicationName>
    <prism:volume>1</prism:volume>
    <prism:startingPage>11</prism:startingPage>
    <prism:endingPage>18</prism:endingPage>
    <prism:category>bag-of-features</prism:category>
    <prism:category>object-categorization</prism:category>
    <prism:category>object-recognition</prism:category>
    <prism:category>photo2search</prism:category>
    <prism:category>reading</prism:category>
    <prism:category>spatial-relationship</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/1151036">
    <title>Spatial weighting for bag-of-features</title>
    <link>http://www.citeulike.org/group/114/article/1151036</link>
    <description>&lt;i&gt;(2006)&lt;/i&gt;</description>
    <dc:title>Spatial weighting for bag-of-features</dc:title>

    <dc:creator>Marcin Marszałek</dc:creator>
    <dc:creator>Cordelia Schmid</dc:creator>
    <dc:source>(2006)</dc:source>
    <dc:date>2007-03-09T11:27:24-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:category>bag-of-features</prism:category>
    <prism:category>object-categorization</prism:category>
    <prism:category>object-recognition</prism:category>
    <prism:category>photo2search</prism:category>
    <prism:category>reading</prism:category>
    <prism:category>spatial-relationship</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/1139916">
    <title>The Layout Consistent Random Field for Recognizing and Segmenting Partially Occluded Objects</title>
    <link>http://www.citeulike.org/group/114/article/1139916</link>
    <description>&lt;i&gt;Computer Vision and Pattern Recognition, 2006 IEEE Computer Society Conference on, Vol. 1 (2006), pp. 37-44.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;This paper addresses the problem of detecting and segmenting partially occluded objects of a known category. We first define a part labelling which densely covers the object. Our Layout Consistent Random Field (LayoutCRF) model then imposes asymmetric local spatial constraints on these labels to ensure the consistent layout of parts whilst allowing for object deformation. Arbitrary occlusions of the object are handled by avoiding the assumption that the whole object is visible. The resulting system is both efficient to train and to apply to novel images, due to a novel annealed layout-consistent expansion move algorithm paired with a randomised decision tree classifier. We apply our technique to images of cars and faces and demonstrate state-of-the-art detection and segmentation performance even in the presence of partial occlusion.</description>
    <dc:title>The Layout Consistent Random Field for Recognizing and Segmenting Partially Occluded Objects</dc:title>

    <dc:creator>J Winn</dc:creator>
    <dc:creator>J Shotton</dc:creator>
    <dc:identifier>doi:10.1109/CVPR.2006.305</dc:identifier>
    <dc:source>Computer Vision and Pattern Recognition, 2006 IEEE Computer Society Conference on, Vol. 1 (2006), pp. 37-44.</dc:source>
    <dc:date>2007-03-04T15:45:24-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Computer Vision and Pattern Recognition, 2006 IEEE Computer Society Conference on</prism:publicationName>
    <prism:volume>1</prism:volume>
    <prism:startingPage>37</prism:startingPage>
    <prism:endingPage>44</prism:endingPage>
    <prism:category>co-algorithm</prism:category>
    <prism:category>graphical-model</prism:category>
    <prism:category>object-recognition</prism:category>
    <prism:category>random-field</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/1139912">
    <title>Located Hidden Random Fields: Learning Discriminative Parts for Object Detection</title>
    <link>http://www.citeulike.org/group/114/article/1139912</link>
    <description>&lt;i&gt;Vol. 3 (2006)&lt;/i&gt;</description>
    <dc:title>Located Hidden Random Fields: Learning Discriminative Parts for Object Detection</dc:title>

    <dc:creator>Ashish Kapoor</dc:creator>
    <dc:creator>John Winn</dc:creator>
    <dc:source>Vol. 3 (2006)</dc:source>
    <dc:date>2007-03-04T15:41:47-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:volume>3</prism:volume>
    <prism:category>graphical-model</prism:category>
    <prism:category>object-detection</prism:category>
    <prism:category>random-field</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/1139906">
    <title>Object categorization by learned universal visual dictionary</title>
    <link>http://www.citeulike.org/group/114/article/1139906</link>
    <description>&lt;i&gt;Computer Vision, 2005. ICCV 2005. Tenth IEEE International Conference on, Vol. 2 (2005), pp. 1800-1807 Vol. 2.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;This paper presents a new algorithm for the automatic recognition of object classes from images (categorization). Compact and yet discriminative appearance-based object class models are automatically learned from a set of training images. The method is simple and extremely fast, making it suitable for many applications such as semantic image retrieval, Web search, and interactive image editing. It classifies a region according to the proportions of different visual words (clusters in feature space). The specific visual words and the typical proportions in each object are learned from a segmented training set. The main contribution of this paper is twofold: i) an optimally compact visual dictionary is learned by pair-wise merging of visual words from an initially large dictionary. The final visual words are described by GMMs. ii) A novel statistical measure of discrimination is proposed which is optimized by each merge operation. High classification accuracy is demonstrated for nine object classes on photographs of real objects viewed under general lighting conditions, poses and viewpoints. The set of test images used for validation comprise: i) photographs acquired by us, ii) images from the Web and iii) images from the recently released Pascal dataset. The proposed algorithm performs well on both texture-rich objects (e.g. grass, sky, trees) and structure-rich ones (e.g. cars, bikes, planes).</description>
    <dc:title>Object categorization by learned universal visual dictionary</dc:title>

    <dc:creator>J Winn</dc:creator>
    <dc:creator>A Criminisi</dc:creator>
    <dc:creator>T Minka</dc:creator>
    <dc:source>Computer Vision, 2005. ICCV 2005. Tenth IEEE International Conference on, Vol. 2 (2005), pp. 1800-1807 Vol. 2.</dc:source>
    <dc:date>2007-03-04T15:37:13-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Computer Vision, 2005. ICCV 2005. Tenth IEEE International Conference on</prism:publicationName>
    <prism:volume>2</prism:volume>
    <prism:startingPage>1800</prism:startingPage>
    <prism:endingPage>1807 Vol. 2</prism:endingPage>
    <prism:category>graphical-model</prism:category>
    <prism:category>object-categorization</prism:category>
    <prism:category>object-recognition</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/1139902">
    <title>LOCUS: learning object classes with unsupervised segmentation</title>
    <link>http://www.citeulike.org/group/114/article/1139902</link>
    <description>&lt;i&gt;Computer Vision, 2005. ICCV 2005. Tenth IEEE International Conference on, Vol. 1 (2005), pp. 756-763 Vol. 1.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We address the problem of learning object class models and object segmentations from unannotated images. We introduce LOCUS (learning object classes with unsupervised segmentation) which uses a generative probabilistic model to combine bottom-up cues of color and edge with top-down cues of shape and pose. A key aspect of this model is that the object appearance is allowed to vary from image to image, allowing for significant within-class variation. By iteratively updating the belief in the object's position, size, segmentation and pose, LOCUS avoids making hard decisions about any of these quantities and so allows for each to be refined at any stage. We show that LOCUS successfully learns an object class model from unlabeled images, whilst also giving segmentation accuracies that rival existing supervised methods. Finally, we demonstrate simultaneous recognition and segmentation in novel images using the learned models for a number of object classes, as well as unsupervised object discovery and tracking in video.</description>
    <dc:title>LOCUS: learning object classes with unsupervised segmentation</dc:title>

    <dc:creator>J Winn</dc:creator>
    <dc:creator>N Jojic</dc:creator>
    <dc:identifier>doi:10.1109/ICCV.2005.148</dc:identifier>
    <dc:source>Computer Vision, 2005. ICCV 2005. Tenth IEEE International Conference on, Vol. 1 (2005), pp. 756-763 Vol. 1.</dc:source>
    <dc:date>2007-03-04T15:31:34-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Computer Vision, 2005. ICCV 2005. Tenth IEEE International Conference on</prism:publicationName>
    <prism:volume>1</prism:volume>
    <prism:startingPage>756</prism:startingPage>
    <prism:endingPage>763 Vol. 1</prism:endingPage>
    <prism:category>graphical-model</prism:category>
    <prism:category>object-categorization</prism:category>
    <prism:category>object-recognition</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/832446">
    <title>Modeling annotated data</title>
    <link>http://www.citeulike.org/group/114/article/832446</link>
    <description>&lt;i&gt;(2003), pp. 127-134.&lt;/i&gt;</description>
    <dc:title>Modeling annotated data</dc:title>

    <dc:creator>David Blei</dc:creator>
    <dc:creator>Michael Jordan</dc:creator>
    <dc:identifier>doi:10.1145/860435.860460</dc:identifier>
    <dc:source>(2003), pp. 127-134.</dc:source>
    <dc:date>2006-09-06T15:07:16-00:00</dc:date>
    <prism:publicationYear>2003</prism:publicationYear>
    <prism:startingPage>127</prism:startingPage>
    <prism:endingPage>134</prism:endingPage>
    <prism:publisher>ACM Press</prism:publisher>
    <prism:category>graphical-model</prism:category>
    <prism:category>learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/1075713">
    <title>Clustering Appearance and Shape by Learning Jigsaws</title>
    <link>http://www.citeulike.org/group/114/article/1075713</link>
    <description>&lt;i&gt;Vol. 19 (2006)&lt;/i&gt;</description>
    <dc:title>Clustering Appearance and Shape by Learning Jigsaws</dc:title>

    <dc:creator>Anitha Kannan</dc:creator>
    <dc:creator>John Winn</dc:creator>
    <dc:creator>Carsten Rother</dc:creator>
    <dc:source>Vol. 19 (2006)</dc:source>
    <dc:date>2007-01-30T09:33:40-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:volume>19</prism:volume>
    <prism:category>graphical-model</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/1072329">
    <title>Balanced Graph Matching</title>
    <link>http://www.citeulike.org/group/114/article/1072329</link>
    <description>&lt;i&gt;(2006)&lt;/i&gt;</description>
    <dc:title>Balanced Graph Matching</dc:title>

    <dc:creator>Timothee Cour</dc:creator>
    <dc:creator>Praveen Srinivasan</dc:creator>
    <dc:creator>Jinbo Shi</dc:creator>
    <dc:source>(2006)</dc:source>
    <dc:date>2007-01-28T07:48:44-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:category>graph-matching</prism:category>
    <prism:category>spectral</prism:category>
    <prism:category>spectral-matching</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/996973">
    <title>SURF: Speeded-Up Robust Features</title>
    <link>http://www.citeulike.org/group/114/article/996973</link>
    <description>&lt;i&gt;&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;In this paper, we present a novel scale- and rotation-invariant interest point detector and descriptor, coined SURF (Speeded Up Robust Features). It approximates or even outperforms previously proposed schemes with respect to repeatability, distinctiveness and robustness, yet can be computed and compared much faster. This is achieved by relying on integral images for image convolutions; by building on the strengths of the leading existing detectors and descriptors (in casu, using a Hessian matrix-based measure for the detector, and a distribution-based descriptor); and by simplifying these methods to the essential. This leads to a combination of novel detection, description, and matching steps. The paper presents experimental results on a standard evaluation set, as well as on imagery obtained in the context of a real-life object recognition application. Both show SURF's strong performance.</description>
    <dc:title>SURF: Speeded-Up Robust Features</dc:title>

    <dc:creator>Herbert Bay</dc:creator>
    <dc:creator>Tinne Tuytelaars</dc:creator>
    <dc:creator>Luc Van Gool</dc:creator>
    <dc:date>2006-12-15T13:52:54-00:00</dc:date>
    <prism:category>local-feature</prism:category>
    <prism:category>matching</prism:category>
    <prism:category>object-categorization</prism:category>
    <prism:category>object-recognition</prism:category>
    <prism:category>photo2search</prism:category>
    <prism:category>sift</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/965072">
    <title>Unsupervised Learning of Categories from Sets of Partially Matching Image Features</title>
    <link>http://www.citeulike.org/group/114/article/965072</link>
    <description>&lt;i&gt;Computer Vision and Pattern Recognition, 2006 IEEE Computer Society Conference on, Vol. 1 (2006), pp. 19-25.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We present a method to automatically learn object categories from unlabeled images. Each image is represented by an unordered set of local features, and all sets are embedded into a space where they cluster according to their partial-match feature correspondences. After efficiently computing the pairwise affinities between the input images in this space, a spectral clustering technique is used to recover the primary groupings among the images. We introduce an efficient means of refining these groupings according to intra-cluster statistics over the subsets of features selected by the partial matches between the images, and based on an optional, variable amount of user supervision. We compute the consistent subsets of feature correspondences within a grouping to infer category feature masks. The output of the algorithm is a partition of the data into a set of learned categories, and a set of classifiers trained from these ranked partitions that can recognize the categories in novel images.</description>
    <dc:title>Unsupervised Learning of Categories from Sets of Partially Matching Image Features</dc:title>

    <dc:creator>K Grauman</dc:creator>
    <dc:creator>T Darrell</dc:creator>
    <dc:identifier>doi:10.1109/CVPR.2006.322</dc:identifier>
    <dc:source>Computer Vision and Pattern Recognition, 2006 IEEE Computer Society Conference on, Vol. 1 (2006), pp. 19-25.</dc:source>
    <dc:date>2006-11-28T09:38:21-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Computer Vision and Pattern Recognition, 2006 IEEE Computer Society Conference on</prism:publicationName>
    <prism:volume>1</prism:volume>
    <prism:startingPage>19</prism:startingPage>
    <prism:endingPage>25</prism:endingPage>
    <prism:category>histogram</prism:category>
    <prism:category>kernel</prism:category>
    <prism:category>matching</prism:category>
    <prism:category>spatial-pyramid-matching</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/984042">
    <title>Video Google: a text retrieval approach to object matching in videos</title>
    <link>http://www.citeulike.org/group/114/article/984042</link>
    <description>&lt;i&gt;Computer Vision, 2003. Proceedings. Ninth IEEE International Conference on (2003), pp. 1470-1477 vol.2.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We describe an approach to object and scene retrieval which searches for and localizes all the occurrences of a user outlined object in a video. The object is represented by a set of viewpoint invariant region descriptors so that recognition can proceed successfully despite changes in viewpoint, illumination and partial occlusion. The temporal continuity of the video within a shot is used to track the regions in order to reject unstable regions and reduce the effects of noise in the descriptors. The analogy with text retrieval is in the implementation where matches on descriptors are pre-computed (using vector quantization), and inverted file systems and document rankings are used. The result is that retrieved is immediate, returning a ranked list of key frames/shots in the manner of Google. The method is illustrated for matching in two full length feature films.</description>
    <dc:title>Video Google: a text retrieval approach to object matching in videos</dc:title>

    <dc:creator>J Sivic</dc:creator>
    <dc:creator>A Zisserman</dc:creator>
    <dc:identifier>doi:10.1109/ICCV.2003.1238663</dc:identifier>
    <dc:source>Computer Vision, 2003. Proceedings. Ninth IEEE International Conference on (2003), pp. 1470-1477 vol.2.</dc:source>
    <dc:date>2006-12-08T04:52:56-00:00</dc:date>
    <prism:publicationYear>2003</prism:publicationYear>
    <prism:publicationName>Computer Vision, 2003. Proceedings. Ninth IEEE International Conference on</prism:publicationName>
    <prism:startingPage>1470</prism:startingPage>
    <prism:endingPage>1477 vol.2</prism:endingPage>
    <prism:category>photo2search</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/977808">
    <title>A Visual Attention Based Region-of-Interest Determination Framework for Video Sequences</title>
    <link>http://www.citeulike.org/group/114/article/977808</link>
    <description>&lt;i&gt;IEICE - Trans. Inf. Syst., Vol. E88-D, No. 7. (2005), pp. 1578-1586.&lt;/i&gt;</description>
    <dc:title>A Visual Attention Based Region-of-Interest Determination Framework for Video Sequences</dc:title>

    <dc:creator>Wen-Huang Cheng</dc:creator>
    <dc:creator>Wei-Ta Chu</dc:creator>
    <dc:creator>Ja-Ling Wu</dc:creator>
    <dc:identifier>doi:10.1093/ietisy</dc:identifier>
    <dc:source>IEICE - Trans. Inf. Syst., Vol. E88-D, No. 7. (2005), pp. 1578-1586.</dc:source>
    <dc:date>2006-12-07T12:35:09-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>IEICE - Trans. Inf. Syst.</prism:publicationName>
    <prism:issn>0916-8532</prism:issn>
    <prism:volume>E88-D</prism:volume>
    <prism:number>7</prism:number>
    <prism:startingPage>1578</prism:startingPage>
    <prism:endingPage>1586</prism:endingPage>
    <prism:publisher>Oxford University Press</prism:publisher>
    <prism:category>attention</prism:category>
    <prism:category>spatial-temporal-analysis</prism:category>
    <prism:category>video-attention</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/977805">
    <title>Tiling slideshow</title>
    <link>http://www.citeulike.org/group/114/article/977805</link>
    <description>&lt;i&gt;(2006), pp. 25-34.&lt;/i&gt;</description>
    <dc:title>Tiling slideshow</dc:title>

    <dc:creator>Jun-Cheng Chen</dc:creator>
    <dc:creator>Wei-Ta Chu</dc:creator>
    <dc:creator>Jin-Hau Kuo</dc:creator>
    <dc:creator>Chung-Yi Weng</dc:creator>
    <dc:creator>Ja-Ling Wu</dc:creator>
    <dc:identifier>doi:10.1145/1180639.1180653</dc:identifier>
    <dc:source>(2006), pp. 25-34.</dc:source>
    <dc:date>2006-12-07T12:32:03-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:startingPage>25</prism:startingPage>
    <prism:endingPage>34</prism:endingPage>
    <prism:publisher>ACM Press</prism:publisher>
    <prism:category>adaptation</prism:category>
    <prism:category>attention-application</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/977802">
    <title>Automatic video region-of-interest determination based on user attention model</title>
    <link>http://www.citeulike.org/group/114/article/977802</link>
    <description>&lt;i&gt;Circuits and Systems, 2005. ISCAS 2005. IEEE International Symposium on (2005), pp. 3219-3222 Vol. 4.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;The paper presents a framework for automatic video region-of-interest determination based on a user attention model. A set of attempts on using video attention features and knowledge of applied media aesthetics are made. The three types of visual attention features used are intensity, color, and motion. Referring to aesthetic principles, these features are combined according to camera motion types on the basis of a newly proposed video analysis unit, frame-segment. We conduct subjective experiments on several kinds of video data and demonstrate the effectiveness of the proposed framework.</description>
    <dc:title>Automatic video region-of-interest determination based on user attention model</dc:title>

    <dc:creator>Wen-Huang Cheng</dc:creator>
    <dc:creator>Wei-Ta Chu</dc:creator>
    <dc:creator>Jin-Hau Kuo</dc:creator>
    <dc:creator>Ja-Ling Wu</dc:creator>
    <dc:source>Circuits and Systems, 2005. ISCAS 2005. IEEE International Symposium on (2005), pp. 3219-3222 Vol. 4.</dc:source>
    <dc:date>2006-12-07T12:21:23-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Circuits and Systems, 2005. ISCAS 2005. IEEE International Symposium on</prism:publicationName>
    <prism:startingPage>3219</prism:startingPage>
    <prism:endingPage>3222 Vol. 4</prism:endingPage>
    <prism:category>video-attention</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/911348">
    <title>Visual Attention Detection in Video Sequences Using Spatiotemporal Cues</title>
    <link>http://www.citeulike.org/group/114/article/911348</link>
    <description>&lt;i&gt;ACM International Conference on Multimedia (ACM MM) (2006)&lt;/i&gt;</description>
    <dc:title>Visual Attention Detection in Video Sequences Using Spatiotemporal Cues</dc:title>

    <dc:creator>Yun Zhai</dc:creator>
    <dc:creator>Mubarak Shah</dc:creator>
    <dc:source>ACM International Conference on Multimedia (ACM MM) (2006)</dc:source>
    <dc:date>2006-10-24T17:55:26-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>ACM International Conference on Multimedia (ACM MM)</prism:publicationName>
    <prism:category>spatial-temporal-analysis</prism:category>
    <prism:category>video-attention</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/957702">
    <title>A Comparison of Affine Region Detectors</title>
    <link>http://www.citeulike.org/group/114/article/957702</link>
    <description>&lt;i&gt;Int. J. Comput. Vision, Vol. 65, No. 1-2. (2005), pp. 43-72.&lt;/i&gt;</description>
    <dc:title>A Comparison of Affine Region Detectors</dc:title>

    <dc:creator>K Mikolajczyk</dc:creator>
    <dc:creator>T Tuytelaars</dc:creator>
    <dc:creator>C Schmid</dc:creator>
    <dc:creator>A Zisserman</dc:creator>
    <dc:creator>J Matas</dc:creator>
    <dc:creator>F Schaffalitzky</dc:creator>
    <dc:creator>T Kadir</dc:creator>
    <dc:creator>L Van Gool</dc:creator>
    <dc:identifier>doi:10.1007/s11263-005-3848-x</dc:identifier>
    <dc:source>Int. J. Comput. Vision, Vol. 65, No. 1-2. (2005), pp. 43-72.</dc:source>
    <dc:date>2006-11-22T16:54:07-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Int. J. Comput. Vision</prism:publicationName>
    <prism:issn>0920-5691</prism:issn>
    <prism:volume>65</prism:volume>
    <prism:number>1-2</prism:number>
    <prism:startingPage>43</prism:startingPage>
    <prism:endingPage>72</prism:endingPage>
    <prism:publisher>Kluwer Academic Publishers</prism:publisher>
    <prism:category>interest-point-detector</prism:category>
    <prism:category>photo2search</prism:category>
    <prism:category>reading</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/974355">
    <title>An efficient parts-based near-duplicate and sub-image retrieval system</title>
    <link>http://www.citeulike.org/group/114/article/974355</link>
    <description>&lt;i&gt;(2004), pp. 869-876.&lt;/i&gt;</description>
    <dc:title>An efficient parts-based near-duplicate and sub-image retrieval system</dc:title>

    <dc:creator>Yan Ke</dc:creator>
    <dc:creator>Rahul Sukthankar</dc:creator>
    <dc:creator>Larry Huston</dc:creator>
    <dc:identifier>doi:10.1145/1027527.1027729</dc:identifier>
    <dc:source>(2004), pp. 869-876.</dc:source>
    <dc:date>2006-12-05T07:28:54-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:startingPage>869</prism:startingPage>
    <prism:endingPage>876</prism:endingPage>
    <prism:publisher>ACM Press</prism:publisher>
    <prism:category>photo2search</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/974063">
    <title>Scalable Recognition with a Vocabulary Tree</title>
    <link>http://www.citeulike.org/group/114/article/974063</link>
    <description>&lt;i&gt;Computer Vision and Pattern Recognition, 2006 IEEE Computer Society Conference on, Vol. 2 (2006), pp. 2161-2168.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;A recognition scheme that scales efficiently to a large number of objects is presented. The efficiency and quality is exhibited in a live demonstration that recognizes CD-covers from a database of 40000 images of popular music CD&#146;s. The scheme builds upon popular techniques of indexing descriptors extracted from local regions, and is robust to background clutter and occlusion. The local region descriptors are hierarchically quantized in a vocabulary tree. The vocabulary tree allows a larger and more discriminatory vocabulary to be used efficiently, which we show experimentally leads to a dramatic improvement in retrieval quality. The most significant property of the scheme is that the tree directly defines the quantization. The quantization and the indexing are therefore fully integrated, essentially being one and the same. The recognition quality is evaluated through retrieval on a database with ground truth, showing the power of the vocabulary tree approach, going as high as 1 million images.</description>
    <dc:title>Scalable Recognition with a Vocabulary Tree</dc:title>

    <dc:creator>D Nister</dc:creator>
    <dc:creator>H Stewenius</dc:creator>
    <dc:source>Computer Vision and Pattern Recognition, 2006 IEEE Computer Society Conference on, Vol. 2 (2006), pp. 2161-2168.</dc:source>
    <dc:date>2006-12-05T03:35:14-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Computer Vision and Pattern Recognition, 2006 IEEE Computer Society Conference on</prism:publicationName>
    <prism:volume>2</prism:volume>
    <prism:startingPage>2161</prism:startingPage>
    <prism:endingPage>2168</prism:endingPage>
    <prism:category>object-categorization</prism:category>
    <prism:category>object-recognition</prism:category>
    <prism:category>photo2search</prism:category>
    <prism:category>reading</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/973069">
    <title>SURF: Speeded Up Robust Features</title>
    <link>http://www.citeulike.org/group/114/article/973069</link>
    <description>&lt;i&gt;(7-13 May 2006)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;In this paper, we present a novel scale- and rotation-invariant interest point detector and descriptor, coined SURF (Speeded Up Robust Features). It approximates or even outperforms previously proposed schemes with respect to repeatability, distinctiveness, and robustness, yet can be computed and compared much faster. This is achieved by replying on integral images for image convolutions; by building on the strengths of the leading existing detectors and descriptors (in casu, using a Hessian matrix-based measure for the detector, and a distribution-based descriptor); and by simplifying these methods to the essential. This leads to a combination of novel detection, description, and matching steps. The paper presents experimental results on a standard evaluation set, as well as on imagery obtained in the context of a real-life object recognition application. Both show SURF's strong performance.</description>
    <dc:title>SURF: Speeded Up Robust Features</dc:title>

    <dc:creator>Herbert Bay</dc:creator>
    <dc:creator>Tinne Tuytelaars</dc:creator>
    <dc:creator>And Van Gool</dc:creator>
    <dc:source>(7-13 May 2006)</dc:source>
    <dc:date>2006-12-04T13:24:26-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:category>local-feature</prism:category>
    <prism:category>sift</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/973036">
    <title>Photo-to-Search: Using Camera Phones to Inquire of the Surrounding World</title>
    <link>http://www.citeulike.org/group/114/article/973036</link>
    <description>&lt;i&gt;Mobile Data Management, 2006. MDM 2006. 7th International Conference on (2006), pp. 46-46.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;With the pervasive use of camera phones, the embedded camera has been considered as a promising HCI manner for mobiles. With necessary technologies, it is possible to become a powerful tool to acquire the information in daily life. We have designed and implemented a system named Photo-to-Search to carry out queries from camera phones simply by taking some photos of interested objects. The captured pictures are compared with a large amount of Web images to select the ones which contain the same prominent object. Consequently, the related information is extracted from the Web pages where the matched images locate. In our demo, data of large buildings, storefronts and products are collected and these kinds of queries are specifically demonstrated to show the efficiency and the effectiveness of our system.</description>
    <dc:title>Photo-to-Search: Using Camera Phones to Inquire of the Surrounding World</dc:title>

    <dc:creator>Menglei Jia</dc:creator>
    <dc:creator>Xin Fan</dc:creator>
    <dc:creator>Xing Xie</dc:creator>
    <dc:creator>Mingjing Li</dc:creator>
    <dc:creator>Wei-Ying Ma</dc:creator>
    <dc:source>Mobile Data Management, 2006. MDM 2006. 7th International Conference on (2006), pp. 46-46.</dc:source>
    <dc:date>2006-12-04T12:53:15-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Mobile Data Management, 2006. MDM 2006. 7th International Conference on</prism:publicationName>
    <prism:startingPage>46</prism:startingPage>
    <prism:endingPage>46</prism:endingPage>
    <prism:category>photo2search</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/972899">
    <title>Video retargeting: automating pan and scan</title>
    <link>http://www.citeulike.org/group/114/article/972899</link>
    <description>&lt;i&gt;(2006), pp. 241-250.&lt;/i&gt;</description>
    <dc:title>Video retargeting: automating pan and scan</dc:title>

    <dc:creator>Feng Liu</dc:creator>
    <dc:creator>Michael Gleicher</dc:creator>
    <dc:identifier>doi:10.1145/1180639.1180702</dc:identifier>
    <dc:source>(2006), pp. 241-250.</dc:source>
    <dc:date>2006-12-04T07:19:44-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:startingPage>241</prism:startingPage>
    <prism:endingPage>250</prism:endingPage>
    <prism:publisher>ACM Press</prism:publisher>
    <prism:category>toread</prism:category>
    <prism:category>video-attention</prism:category>
    <prism:category>video-synthesis</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/967062">
    <title>Full-frame video stabilization with motion inpainting</title>
    <link>http://www.citeulike.org/group/114/article/967062</link>
    <description>&lt;i&gt;Pattern Analysis and Machine Intelligence, IEEE Transactions on, Vol. 28, No. 7. (2006), pp. 1150-1163.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Video stabilization is an important video enhancement technology which aims at removing annoying shaky motion from videos. We propose a practical and robust approach of video stabilization that produces full-frame stabilized videos with good visual quality. While most previous methods end up with producing smaller size stabilized videos, our completion method can produce full-frame videos by naturally filling in missing image parts by locally aligning image data of neighboring frames. To achieve this, motion inpainting is proposed to enforce spatial and temporal consistency of the completion in both static and dynamic image areas. In addition, image quality in the stabilized video is enhanced with a new practical deblurring algorithm. Instead of estimating point spread functions, our method transfers and interpolates sharper image pixels of neighboring frames to increase the sharpness of the frame. The proposed video completion and deblurring methods enabled us to develop a complete video stabilizer which can naturally keep the original image quality in the stabilized videos. The effectiveness of our method is confirmed by extensive experiments over a wide variety of videos.</description>
    <dc:title>Full-frame video stabilization with motion inpainting</dc:title>

    <dc:creator>Y Matsushita</dc:creator>
    <dc:creator>E Ofek</dc:creator>
    <dc:creator>Weina Ge</dc:creator>
    <dc:creator>Xiaoou Tang</dc:creator>
    <dc:creator>Heung-Yeung Shum</dc:creator>
    <dc:source>Pattern Analysis and Machine Intelligence, IEEE Transactions on, Vol. 28, No. 7. (2006), pp. 1150-1163.</dc:source>
    <dc:date>2006-11-29T17:08:59-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:publicationName>Pattern Analysis and Machine Intelligence, IEEE Transactions on</prism:publicationName>
    <prism:volume>28</prism:volume>
    <prism:number>7</prism:number>
    <prism:startingPage>1150</prism:startingPage>
    <prism:endingPage>1163</prism:endingPage>
    <prism:category>video-stabilization</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/group/114/article/961316">
    <title>Markov random field modeling in image analysis</title>
    <link>http://www.citeulike.org/group/114/article/961316</link>
    <description>&lt;i&gt;(2001)&lt;/i&gt;</description>
    <dc:title>Markov random field modeling in image analysis</dc:title>

    <dc:creator>Stan Li</dc:creator>
    <dc:source>(2001)</dc:source>
    <dc:date>2006-11-25T06:22:13-00:00</dc:date>
    <prism:publicationYear>2001</prism:publicationYear>
    <prism:publisher>Springer-Verlag New York, Inc.</prism:publisher>
    <prism:category>graphical-model</prism:category>
    <prism:category>learning</prism:category>
    <prism:category>markov-random-field</prism:category>
</item>



</rdf:RDF>

