<?xml version="1.0" encoding="UTF-8"?>

<rdf:RDF
   xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
   xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#"
   xmlns="http://purl.org/rss/1.0/"
   xmlns:dc="http://purl.org/dc/elements/1.1/"
   xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/"
   xmlns:dcterms="http://purl.org/dc/terms/"

>
<channel rdf:about="http://www.citeulike.org/about">
<pubDate>Sat, 26 Jul 2008 04:34:52 BST</pubDate>


	<title>CiteULike: V's library [127 articles]</title>
	<description>CiteULike: V's library [127 articles]</description>


	<link>http://www.citeulike.org/user/V</link>
	<dc:publisher>CiteULike.org</dc:publisher>
	<dc:language>en-gb</dc:language>
	<dc:rights>Copyright &#169; 2004-2008 citeulike.org</dc:rights>
	<items>
    <rdf:Seq>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2111841"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2820988"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2820969"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/472852"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2749926"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2730957"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2730934"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2730868"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2730859"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2730857"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/104300"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2683417"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2683381"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2683375"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2683368"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/1135329"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2683339"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2683317"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2683281"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/465806"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2682924"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2682917"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2682599"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2682567"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2682535"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2682512"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2682508"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2682339"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2682323"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2682305"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2682285"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2678768"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/745875"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2679226"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2679215"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2253110"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/259537"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2253101"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2253086"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2253083"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2253071"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2253067"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2204598"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2204587"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2204567"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/329575"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/2057345"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/1559292"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/1559288"/>
        <rdf:li rdf:resource="http://www.citeulike.org/user/V/article/1559277"/>

	</rdf:Seq>
	</items>
	</channel>


<item rdf:about="http://www.citeulike.org/user/V/article/2111841">
    <title>Iterative classification in relational data</title>
    <link>http://www.citeulike.org/user/V/article/2111841</link>
    <description>&lt;i&gt;(2000)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Relational data offer a unique opportunity for improving the classification accuracy of statistical models. If two objects are related, inferring something about one object can aid inferences about the other. We present an iterative classification procedure that exploits this characteristic of relational data. This approach uses simple Bayesian classifiers in an iterative fashion, dynamically updating the attributes of some objects as inferences are made about related objects. Inferences made...</description>
    <dc:title>Iterative classification in relational data</dc:title>

    <dc:creator>J Neville</dc:creator>
    <dc:creator>D Jensen</dc:creator>
    <dc:source>(2000)</dc:source>
    <dc:date>2007-12-14T06:29:46-00:00</dc:date>
    <prism:publicationYear>2000</prism:publicationYear>
    <prism:category>bayes</prism:category>
    <prism:category>classification</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2820988">
    <title>The Probabilistic Program Dependence Graph and its Application to Fault Diagnosis</title>
    <link>http://www.citeulike.org/user/V/article/2820988</link>
    <description>&lt;i&gt;(23 July 2008)&lt;/i&gt;</description>
    <dc:title>The Probabilistic Program Dependence Graph and its Application to Fault Diagnosis</dc:title>

    <dc:creator>George Baah</dc:creator>
    <dc:creator>Andy Podgurski</dc:creator>
    <dc:creator>Mary Harrold</dc:creator>
    <dc:source>(23 July 2008)</dc:source>
    <dc:date>2008-05-21T18:19:00-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:category>debugging</prism:category>
    <prism:category>dependencygraph</prism:category>
    <prism:category>statistics</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2820969">
    <title>Statistical Debugging Using Latent Topic Models</title>
    <link>http://www.citeulike.org/user/V/article/2820969</link>
    <description>&lt;i&gt;Machine Learning: ECML 2007 (2007), pp. 6-17.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Statistical debugging uses machine learning to model program failures and help identify root causes of bugs. We approach this task using a novel Delta-Latent-Dirichlet-Allocation model. We model execution traces attributed to failed runs of a program as being generated by two types of latent topics: normal usage topics and bug topics. Execution traces attributed to successful runs of the same program, however, are modeled by usage topics only. Joint modeling of both kinds of traces allows us to identify weak bug topics that would otherwise remain undetected. We perform model inference with collapsed Gibbs sampling. In quantitative evaluations on four real programs, our model produces bug topics highly correlated to the true bugs, as measured by the Rand index. Qualitative evaluation by domain experts suggests that our model outperforms existing statistical methods for bug cause identification, and may help support other software tasks not addressed by earlier models.</description>
    <dc:title>Statistical Debugging Using Latent Topic Models</dc:title>

    <dc:creator>David Andrzejewski</dc:creator>
    <dc:creator>Anne Mulhern</dc:creator>
    <dc:creator>Ben Liblit</dc:creator>
    <dc:creator>Xiaojin Zhu</dc:creator>
    <dc:identifier>doi:10.1007/978-3-540-74958-5_5</dc:identifier>
    <dc:source>Machine Learning: ECML 2007 (2007), pp. 6-17.</dc:source>
    <dc:date>2008-05-21T18:05:35-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:publicationName>Machine Learning: ECML 2007</prism:publicationName>
    <prism:startingPage>6</prism:startingPage>
    <prism:endingPage>17</prism:endingPage>
    <prism:category>debugging</prism:category>
    <prism:category>markov</prism:category>
    <prism:category>statistical</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/472852">
    <title>Visualization of test information to assist fault localization</title>
    <link>http://www.citeulike.org/user/V/article/472852</link>
    <description>&lt;i&gt;(2002), pp. 467-477.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;One of the most expensive and time-consuming components of the debugging process is locating the errors or faults. To locate faults, developers must identify statements involved in failures and select suspicious statements that might contain faults. This paper presents a new technique that uses visualization to assist with these tasks. The technique uses color to visually map the participation of each program statement in the outcome of the execution of the program with a test suite, consisting of both passed and failed test cases. Based on this visual mapping, a user can inspect the statements in the program, identify statements involved in failures, and locate potentially faulty statements. The paper also describes a prototype tool that implements our technique along with a set of empirical studies that use the tool for evaluation of the technique. The empirical studies show that, for the subject we studied, the technique can be effective in helping a user locate faults in a program.</description>
    <dc:title>Visualization of test information to assist fault localization</dc:title>

    <dc:creator>James Jones</dc:creator>
    <dc:creator>Mary Harrold</dc:creator>
    <dc:creator>John Stasko</dc:creator>
    <dc:identifier>doi:10.1145/581339.581397</dc:identifier>
    <dc:source>(2002), pp. 467-477.</dc:source>
    <dc:date>2006-01-20T19:41:55-00:00</dc:date>
    <prism:publicationYear>2002</prism:publicationYear>
    <prism:startingPage>467</prism:startingPage>
    <prism:endingPage>477</prism:endingPage>
    <prism:publisher>ACM Press</prism:publisher>
    <prism:category>fault_localization</prism:category>
    <prism:category>sw_engineering</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2749926">
    <title>Xerces2 Java Parser</title>
    <link>http://www.citeulike.org/user/V/article/2749926</link>
    <description>&lt;i&gt;(2007)&lt;/i&gt;</description>
    <dc:title>Xerces2 Java Parser</dc:title>

    <dc:creator>The Apache Project</dc:creator>
    <dc:source>(2007)</dc:source>
    <dc:date>2008-05-03T19:26:59-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:category>dataset</prism:category>
    <prism:category>fse08</prism:category>
    <prism:category>proposal</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2730957">
    <title>RBGL: An interface to the BOOST graph library</title>
    <link>http://www.citeulike.org/user/V/article/2730957</link>
    <description>&lt;i&gt;&lt;/i&gt;</description>
    <dc:title>RBGL: An interface to the BOOST graph library</dc:title>

    <dc:creator>Vince Carey</dc:creator>
    <dc:creator>Li Long</dc:creator>
    <dc:creator>R Gentleman</dc:creator>
    <dc:date>2008-04-28T20:16:31-00:00</dc:date>
    <prism:category>eecs435</prism:category>
    <prism:category>graph_theory</prism:category>
    <prism:category>rpkg</prism:category>
    <prism:category>tool</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2730934">
    <title>Semi-Supervised Learning Literature Survey</title>
    <link>http://www.citeulike.org/user/V/article/2730934</link>
    <description>&lt;i&gt;(14 December 2007)&lt;/i&gt;</description>
    <dc:title>Semi-Supervised Learning Literature Survey</dc:title>

    <dc:creator>Xiaojin Zhu</dc:creator>
    <dc:source>(14 December 2007)</dc:source>
    <dc:date>2008-04-28T20:05:07-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:category>eecs435</prism:category>
    <prism:category>semi-supervised_learning</prism:category>
    <prism:category>survey</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2730868">
    <title>The Java Interactive Profiler</title>
    <link>http://www.citeulike.org/user/V/article/2730868</link>
    <description>&lt;i&gt;(2006)&lt;/i&gt;</description>
    <dc:title>The Java Interactive Profiler</dc:title>

    <dc:creator>JIP Development Team</dc:creator>
    <dc:source>(2006)</dc:source>
    <dc:date>2008-04-28T19:30:19-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:category>eecs435</prism:category>
    <prism:category>java</prism:category>
    <prism:category>profiling</prism:category>
    <prism:category>proposal</prism:category>
    <prism:category>tool</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2730859">
    <title>Learning from Labeled and Unlabeled Data using Graph Mincuts</title>
    <link>http://www.citeulike.org/user/V/article/2730859</link>
    <description>&lt;i&gt;(2001), pp. 19-26.&lt;/i&gt;</description>
    <dc:title>Learning from Labeled and Unlabeled Data using Graph Mincuts</dc:title>

    <dc:creator>Avrim Blum</dc:creator>
    <dc:creator>Shuchi Chawla</dc:creator>
    <dc:source>(2001), pp. 19-26.</dc:source>
    <dc:date>2008-04-28T19:26:43-00:00</dc:date>
    <prism:publicationYear>2001</prism:publicationYear>
    <prism:startingPage>19</prism:startingPage>
    <prism:endingPage>26</prism:endingPage>
    <prism:publisher>Morgan Kaufmann Publishers Inc.</prism:publisher>
    <prism:category>eecs435</prism:category>
    <prism:category>semi-supervised_learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2730857">
    <title>ROME: RSS/Atom syndication and publishing tools</title>
    <link>http://www.citeulike.org/user/V/article/2730857</link>
    <description>&lt;i&gt;(2005)&lt;/i&gt;</description>
    <dc:title>ROME: RSS/Atom syndication and publishing tools</dc:title>

    <dc:creator>ROME Development Team</dc:creator>
    <dc:source>(2005)</dc:source>
    <dc:date>2008-04-28T19:25:41-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:category>dataset</prism:category>
    <prism:category>eecs435</prism:category>
    <prism:category>fse08</prism:category>
    <prism:category>proposal</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/104300">
    <title>Semi-supervised learning using randomized mincuts</title>
    <link>http://www.citeulike.org/user/V/article/104300</link>
    <description>&lt;i&gt;(2004)&lt;/i&gt;</description>
    <dc:title>Semi-supervised learning using randomized mincuts</dc:title>

    <dc:creator>Avrim Blum</dc:creator>
    <dc:creator>John Lafferty</dc:creator>
    <dc:creator>Mugizi Rwebangira</dc:creator>
    <dc:creator>Rajashekar Reddy</dc:creator>
    <dc:identifier>doi:10.1145/1015330.1015429</dc:identifier>
    <dc:source>(2004)</dc:source>
    <dc:date>2005-02-25T22:20:40-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:publisher>ACM Press</prism:publisher>
    <prism:category>eecs435</prism:category>
    <prism:category>semi-supervised_learning</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2683417">
    <title>A New Approach for Event Correlation based on Dependency Graphs</title>
    <link>http://www.citeulike.org/user/V/article/2683417</link>
    <description>&lt;i&gt;(1998)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Today's fault management is characterized by inefficient event management. The events delivered by the managed system frequently descibe symptoms of a problem instead of its cause. If a problem in the managed system occurs, e.g. a network failure or misconfigured software, the administrator often is flooded by a burst of more or less meaningless events indicating symptoms of the problem. The aim of an event correlator is to reduce the number and enrich the meaning of events shown to the...</description>
    <dc:title>A New Approach for Event Correlation based on Dependency Graphs</dc:title>

    <dc:creator>B Gruschke</dc:creator>
    <dc:source>(1998)</dc:source>
    <dc:date>2008-04-17T20:20:42-00:00</dc:date>
    <prism:publicationYear>1998</prism:publicationYear>
    <prism:category>dependencygraph</prism:category>
    <prism:category>event_correlation</prism:category>
    <prism:category>fse08</prism:category>
    <prism:category>issre07</prism:category>
    <prism:category>proposal</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2683381">
    <title>Alarm correlation and fault identification in communication networks</title>
    <link>http://www.citeulike.org/user/V/article/2683381</link>
    <description>&lt;i&gt;Communications, IEEE Transactions on, Vol. 42, No. 234. (1994), pp. 523-533.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Presents an approach for modeling and solving the problem of fault identification and alarm correlation in large communication networks. A single fault in a large network may result in a large number of alarms, and it is often very difficult to isolate the true cause of the fault. This appears to be one of the most important difficulties in managing faults in today's networks. The problem may become worse in the case of multiple faults. The authors present a general methodology for solving the alarm correlation and fault identification problem. They propose a new alarm structure, propose a general model for representing the network, and give two algorithms which can solve the alarm correlation and fault identification problem in the presence of multiple faults. These algorithms differ in the degree of accuracy achieved in identifying the fault, and in the degree of complexity required for implementation</description>
    <dc:title>Alarm correlation and fault identification in communication networks</dc:title>

    <dc:creator>AT Bouloutas</dc:creator>
    <dc:creator>S Calo</dc:creator>
    <dc:creator>A Finkel</dc:creator>
    <dc:identifier>doi:10.1109/TCOMM.1994.577079</dc:identifier>
    <dc:source>Communications, IEEE Transactions on, Vol. 42, No. 234. (1994), pp. 523-533.</dc:source>
    <dc:date>2008-04-17T20:09:26-00:00</dc:date>
    <prism:publicationYear>1994</prism:publicationYear>
    <prism:publicationName>Communications, IEEE Transactions on</prism:publicationName>
    <prism:volume>42</prism:volume>
    <prism:number>234</prism:number>
    <prism:startingPage>523</prism:startingPage>
    <prism:endingPage>533</prism:endingPage>
    <prism:category>distributed</prism:category>
    <prism:category>event_correlation</prism:category>
    <prism:category>fse08</prism:category>
    <prism:category>issre07</prism:category>
    <prism:category>proposal</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2683375">
    <title>High speed and robust event correlation</title>
    <link>http://www.citeulike.org/user/V/article/2683375</link>
    <description>&lt;i&gt;Communications Magazine, IEEE, Vol. 34, No. 5. (1996), pp. 82-90.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;The authors describe a network management system and illustrate its application to managing a distributed database application on a complex enterprise network</description>
    <dc:title>High speed and robust event correlation</dc:title>

    <dc:creator>SA Yemini</dc:creator>
    <dc:creator>S Kliger</dc:creator>
    <dc:creator>E Mozes</dc:creator>
    <dc:creator>Y Yemini</dc:creator>
    <dc:creator>D Ohsie</dc:creator>
    <dc:identifier>doi:10.1109/35.492975</dc:identifier>
    <dc:source>Communications Magazine, IEEE, Vol. 34, No. 5. (1996), pp. 82-90.</dc:source>
    <dc:date>2008-04-17T20:07:39-00:00</dc:date>
    <prism:publicationYear>1996</prism:publicationYear>
    <prism:publicationName>Communications Magazine, IEEE</prism:publicationName>
    <prism:volume>34</prism:volume>
    <prism:number>5</prism:number>
    <prism:startingPage>82</prism:startingPage>
    <prism:endingPage>90</prism:endingPage>
    <prism:category>distributed</prism:category>
    <prism:category>event_correlation</prism:category>
    <prism:category>fse08</prism:category>
    <prism:category>issre07</prism:category>
    <prism:category>proposal</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2683368">
    <title>Extracting the Representative Failure Executions via Clustering Analysis Based on Markov Profile Model</title>
    <link>http://www.citeulike.org/user/V/article/2683368</link>
    <description>&lt;i&gt;Advanced Data Mining and Applications (2005), pp. 217-224.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;During the debugging of a program to be released, it is unnecessary and impractical for developers to check every failure execution. How to extract the typical ones from the vast set of failure executions is very important for reducing the debugging efforts. In this paper, a revised Markov model used to depict program behaviors is presented firstly. Based on this model, the dissimilarity of two profile matrixes is also defined. After separating the failure executions and non-failure executions into two different subsets, iterative partition clustering and a sampling strategy called priority-ranked n-per-cluster are employed to extract representative failure executions. Finally, with the assistance of our prototype CppTest, we have performed experiment on five subject programs. The results show that the clustering and sampling techniques based on revised Markov model is more effective to find faults than Podgurski’s method.</description>
    <dc:title>Extracting the Representative Failure Executions via Clustering Analysis Based on Markov Profile Model</dc:title>

    <dc:creator>Chengying Mao</dc:creator>
    <dc:creator>Yansheng Lu</dc:creator>
    <dc:identifier>doi:10.1007/11527503_26</dc:identifier>
    <dc:source>Advanced Data Mining and Applications (2005), pp. 217-224.</dc:source>
    <dc:date>2008-04-17T20:02:25-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publicationName>Advanced Data Mining and Applications</prism:publicationName>
    <prism:startingPage>217</prism:startingPage>
    <prism:endingPage>224</prism:endingPage>
    <prism:category>classification</prism:category>
    <prism:category>fse08</prism:category>
    <prism:category>issre07</prism:category>
    <prism:category>markov</prism:category>
    <prism:category>proposal</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/1135329">
    <title>Failure proximity: a fault localization-based approach</title>
    <link>http://www.citeulike.org/user/V/article/1135329</link>
    <description>&lt;i&gt;(2006), pp. 46-56.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Recent software systems usually feature an automated failure reporting system, with which a huge number of failing traces are collected every day. In order to prioritize fault diagnosis, failing traces due to the same fault are expected to be grouped together. Previous methods, by hypothesizing that similar failing traces imply the same fault, cluster failing traces based on the literal trace similarity, which we call trace proximity. However, since a fault can be triggered in many ways, failing traces due to the same fault can be quite different. Therefore, previous methods actually group together traces exhibiting similar behaviors, like similar branch coverage, rather than traces due to the same fault. In this paper, we propose a new type of failure proximity, called R-Proximity, which regards two failing traces as similar if they suggest roughly the same fault location. The fault location each failing case suggests is automatically obtained with Sober, an existing statistical debugging tool. We show that with R-Proximity, failing traces due to the same fault can be grouped together. In addition, we find that R-Proximity is helpful for statistical debugging: It can help developers interpret and utilize the statistical debugging result. We illustrate the usage of R-Proximity with a case study on the grep program and some experiments on the Siemens suite, and the result clearly demonstrates the advantage of R-Proximity over trace proximity.</description>
    <dc:title>Failure proximity: a fault localization-based approach</dc:title>

    <dc:creator>Chao Liu</dc:creator>
    <dc:creator>Jiawei Han</dc:creator>
    <dc:identifier>doi:10.1145/1181775.1181782</dc:identifier>
    <dc:source>(2006), pp. 46-56.</dc:source>
    <dc:date>2007-03-02T06:36:57-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:startingPage>46</prism:startingPage>
    <prism:endingPage>56</prism:endingPage>
    <prism:publisher>ACM Press</prism:publisher>
    <prism:category>fault_localization</prism:category>
    <prism:category>fse08</prism:category>
    <prism:category>issre07</prism:category>
    <prism:category>proposal</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2683339">
    <title>Pinpoint: problem determination in large, dynamic Internet services</title>
    <link>http://www.citeulike.org/user/V/article/2683339</link>
    <description>&lt;i&gt;Dependable Systems and Networks, 2002. DSN 2002. Proceedings. International Conference on (2002), pp. 595-604.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Traditional problem determination techniques rely on static dependency models that are difficult to generate accurately in today's large, distributed, and dynamic application environments such as e-commerce systems. We present a dynamic analysis methodology that automates problem determination in these environments by 1) coarse-grained tagging of numerous real client requests as they travel through the system and 2) using data mining techniques to correlate the believed failures and successes of these requests to determine which components are most likely to be at fault. To validate our methodology, we have implemented Pinpoint, a framework for root cause analysis on the J2EE platform that requires no knowledge of the application components. Pinpoint consists of three parts: a communications layer that traces client requests, a failure detector that uses traffic-sniffing and middleware instrumentation, and a data analysis engine. We evaluate Pinpoint by injecting faults into various application components and show that Pinpoint identifies the faulty components with high accuracy and produces few false-positives.</description>
    <dc:title>Pinpoint: problem determination in large, dynamic Internet services</dc:title>

    <dc:creator>MY Chen</dc:creator>
    <dc:creator>E Kiciman</dc:creator>
    <dc:creator>E Fratkin</dc:creator>
    <dc:creator>A Fox</dc:creator>
    <dc:creator>E Brewer</dc:creator>
    <dc:identifier>doi:10.1109/DSN.2002.1029005</dc:identifier>
    <dc:source>Dependable Systems and Networks, 2002. DSN 2002. Proceedings. International Conference on (2002), pp. 595-604.</dc:source>
    <dc:date>2008-04-17T19:53:09-00:00</dc:date>
    <prism:publicationYear>2002</prism:publicationYear>
    <prism:publicationName>Dependable Systems and Networks, 2002. DSN 2002. Proceedings. International Conference on</prism:publicationName>
    <prism:startingPage>595</prism:startingPage>
    <prism:endingPage>604</prism:endingPage>
    <prism:category>anomaly_detection</prism:category>
    <prism:category>distributed</prism:category>
    <prism:category>fse08</prism:category>
    <prism:category>issre07</prism:category>
    <prism:category>proposal</prism:category>
    <prism:category>testing</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2683317">
    <title>Improved error reporting for software that uses black-box components</title>
    <link>http://www.citeulike.org/user/V/article/2683317</link>
    <description>&lt;i&gt;(2007), pp. 101-111.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;An error occurs when software cannot complete a requested action as a result of some problem with its input, configuration, or environment. A high-quality error report allows a user to understand and correct the problem. Unfortunately, the quality of error reports has been decreasing as software becomes more complex and layered. End-users take the cryptic error messages given to them by programsand struggle to fix their problems using search engines and support websites. Developers cannot improve their error messages when they receive an ambiguous or otherwise insufficient error indicator from a black-box software component. We introduce Clarify, a system that improves error reporting by classifying application behavior. Clarify uses minimally invasive monitoring to generate a behavior profile, which is a summary of the program's execution history. A machine learning classifier uses the behavior profile to classify the application's behavior, thereby enabling a more precise error report than the output of the application itself. We evaluate a prototype Clarify system on ambiguous error messages generated by large, modern applications like gcc, La-TeX, and the Linux kernel. For a performance cost of less than 1% on user applications and 4.7% on the Linux kernel, the proto type correctly disambiguates at least 85% of application behaviors that result in ambiguous error reports. This accuracy does not degrade significantly with more behaviors: a Clarify classifier for 81 La-TeX error messages is at most 2.5% less accurate than a classifier for 27 LaTeX error messages. Finally, we show that without any human effort to build a classifier, Clarify can provide nearest-neighbor software support, where users who experience a problem are told about 5 other users who might have had the same problem. On average 2.3 of the 5 users that Clarify identifies have experienced the same problem.</description>
    <dc:title>Improved error reporting for software that uses black-box components</dc:title>

    <dc:creator>Jungwoo Ha</dc:creator>
    <dc:creator>Christopher Rossbach</dc:creator>
    <dc:creator>Jason Davis</dc:creator>
    <dc:creator>Indrajit Roy</dc:creator>
    <dc:creator>Hany Ramadan</dc:creator>
    <dc:creator>Donald Porter</dc:creator>
    <dc:creator>David Chen</dc:creator>
    <dc:creator>Emmett Witchel</dc:creator>
    <dc:identifier>doi:10.1145/1250734.1250747</dc:identifier>
    <dc:source>(2007), pp. 101-111.</dc:source>
    <dc:date>2008-04-17T19:49:22-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:startingPage>101</prism:startingPage>
    <prism:endingPage>111</prism:endingPage>
    <prism:publisher>ACM</prism:publisher>
    <prism:category>beta_testing</prism:category>
    <prism:category>fse08</prism:category>
    <prism:category>proposal</prism:category>
    <prism:category>sw_engineering</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2683281">
    <title>An empirical evaluation of test case filtering techniques based on exercising complex information flows</title>
    <link>http://www.citeulike.org/user/V/article/2683281</link>
    <description>&lt;i&gt;(2005), pp. 412-421.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Some software defects trigger failures only when certain complex information flows occur within the software. Profiling and analyzing such flows therefore provides a potentially important basis for filtering test cases. We report the results of an empirical evaluation of several test case filtering techniques that are based on exercising complex information flows. Both coverage-based and profile-distribution-based filtering techniques are considered. They are compared to filtering techniques based on exercising basic blocks, branches, function calls, and def-use pairs, with respect to their effectiveness for revealing defects.</description>
    <dc:title>An empirical evaluation of test case filtering techniques based on exercising complex information flows</dc:title>

    <dc:creator>David Leon</dc:creator>
    <dc:creator>Wes Masri</dc:creator>
    <dc:creator>Andy Podgurski</dc:creator>
    <dc:identifier>doi:10.1145/1062455.1062531</dc:identifier>
    <dc:source>(2005), pp. 412-421.</dc:source>
    <dc:date>2008-04-17T19:39:39-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:startingPage>412</prism:startingPage>
    <prism:endingPage>421</prism:endingPage>
    <prism:publisher>ACM</prism:publisher>
    <prism:category>fse08</prism:category>
    <prism:category>information_flow</prism:category>
    <prism:category>issre07</prism:category>
    <prism:category>proposal</prism:category>
    <prism:category>testing</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/465806">
    <title>What Is Web 2.0: Design Patterns and Business Models for the Next Generation of Software</title>
    <link>http://www.citeulike.org/user/V/article/465806</link>
    <description>&lt;i&gt;(30 September 2005)&lt;/i&gt;</description>
    <dc:title>What Is Web 2.0: Design Patterns and Business Models for the Next Generation of Software</dc:title>

    <dc:creator>Tim O'Reilly</dc:creator>
    <dc:source>(30 September 2005)</dc:source>
    <dc:date>2006-01-15T22:39:46-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publisher>O'Reilly Media, Inc</prism:publisher>
    <prism:category>fse08</prism:category>
    <prism:category>news</prism:category>
    <prism:category>proposal</prism:category>
    <prism:category>web20</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2682924">
    <title>A long winding road out of beta</title>
    <link>http://www.citeulike.org/user/V/article/2682924</link>
    <description>&lt;i&gt;(11 February 2005)&lt;/i&gt;</description>
    <dc:title>A long winding road out of beta</dc:title>

    <dc:creator>Paul Festa</dc:creator>
    <dc:source>(11 February 2005)</dc:source>
    <dc:date>2008-04-17T16:48:44-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:publisher>ZDNet</prism:publisher>
    <prism:category>beta_testing</prism:category>
    <prism:category>fse08</prism:category>
    <prism:category>news</prism:category>
    <prism:category>proposal</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2682917">
    <title>Beta Testing for Better Software</title>
    <link>http://www.citeulike.org/user/V/article/2682917</link>
    <description>&lt;i&gt;(23 August 2002)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Implement, operate, and use beta testing immediately with this hands-on guide to the best practices &#60;P&#62;Beta testing is a complex process that, when properly run, provides a wealth of diverse information. But when poorly executed, it delivers little or no data while wasting time and money. Written by a leading expert in the field, this book will help you reach the full potential that beta testing has to offer. &#60;P&#62;Michael Fine compiles the best practices to date so you can effectively bring beta testing into your company’s process to improve product quality. Using real-world case studies, this book begins by clearly explaining what a beta is and why you need one. Fine then explores the beta test procedure and walks through the best processes to use when implementing a test. He concludes by detailing the steps you should take after completing a test in order to take full advantage of the results. &#60;P&#62;With this book, you’ll gain a better understanding of what beta testing is, why every company needs a beta test program, and how to get the most from a test. Fine will help you: &#60;UL&#62; &#60;LI&#62;Understand all the steps involved in beta testing using real-world case studies&#60;/LI&#62; &#60;LI&#62;Implement a beta test using best- known practices&#60;/LI&#62; &#60;LI&#62;Produce better products based on the results of well-run beta tests&#60;/LI&#62; &#60;LI&#62;Apply beta testing across many platforms and many technologies&#60;/LI&#62; &#60;LI&#62;Improve on existing processes and identify critical issues&#60;/LI&#62;&#60;/UL&#62;</description>
    <dc:title>Beta Testing for Better Software</dc:title>

    <dc:creator>Michael Fine</dc:creator>
    <dc:source>(23 August 2002)</dc:source>
    <dc:date>2008-04-17T16:44:30-00:00</dc:date>
    <prism:publicationYear>2002</prism:publicationYear>
    <prism:publisher>Wiley</prism:publisher>
    <prism:category>beta_testing</prism:category>
    <prism:category>fse08</prism:category>
    <prism:category>proposal</prism:category>
    <prism:category>sw_engineering</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2682599">
    <title>jRapture: A Capture/Replay tool for observation-based testing</title>
    <link>http://www.citeulike.org/user/V/article/2682599</link>
    <description>&lt;i&gt;SIGSOFT Softw. Eng. Notes, Vol. 25, No. 5. (September 2000), pp. 158-167.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We describe the design of jRapture: a tool for capturing and replaying Java program executions in the field. jRapture works with Java binaries (byte code) and any compliant implementation of the Java virtual machine. It employs a lightweight, transparent capture process that permits unobtrusive capture of a Java programs executions. jRapture captures interactions between a Java program and the system, including GUI, file, and console inputs, among other types, and on replay it presents each thread with exactly the same input sequence it saw during capture. In addition, jRapture has a profiling interface that permits a Java program to be instrumented for profiling ó after its executions have been captured. Using an XML-based profiling specification language a tester can specify various forms of profiling to be carried out during replay.</description>
    <dc:title>jRapture: A Capture/Replay tool for observation-based testing</dc:title>

    <dc:creator>John Steven</dc:creator>
    <dc:creator>Pravir Chandra</dc:creator>
    <dc:creator>Bob Fleck</dc:creator>
    <dc:creator>Andy Podgurski</dc:creator>
    <dc:identifier>doi:10.1145/347636.348993</dc:identifier>
    <dc:source>SIGSOFT Softw. Eng. Notes, Vol. 25, No. 5. (September 2000), pp. 158-167.</dc:source>
    <dc:date>2008-04-17T15:48:56-00:00</dc:date>
    <prism:publicationYear>2000</prism:publicationYear>
    <prism:publicationName>SIGSOFT Softw. Eng. Notes</prism:publicationName>
    <prism:issn>0163-5948</prism:issn>
    <prism:volume>25</prism:volume>
    <prism:number>5</prism:number>
    <prism:startingPage>158</prism:startingPage>
    <prism:endingPage>167</prism:endingPage>
    <prism:publisher>ACM</prism:publisher>
    <prism:category>fse08</prism:category>
    <prism:category>issre07</prism:category>
    <prism:category>java</prism:category>
    <prism:category>obt</prism:category>
    <prism:category>proposal</prism:category>
    <prism:category>testing</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2682567">
    <title>knnFinder: Fast Near Neighbour Search</title>
    <link>http://www.citeulike.org/user/V/article/2682567</link>
    <description>&lt;i&gt;&lt;/i&gt;</description>
    <dc:title>knnFinder: Fast Near Neighbour Search</dc:title>

    <dc:creator>Samuel Kemp</dc:creator>
    <dc:date>2008-04-17T15:35:28-00:00</dc:date>
    <prism:category>eecs435</prism:category>
    <prism:category>fse08</prism:category>
    <prism:category>proposal</prism:category>
    <prism:category>rpkg</prism:category>
    <prism:category>tool</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2682535">
    <title>R: A Language and Environment for Statistical Computing</title>
    <link>http://www.citeulike.org/user/V/article/2682535</link>
    <description>&lt;i&gt;(2008)&lt;/i&gt;</description>
    <dc:title>R: A Language and Environment for Statistical Computing</dc:title>

    <dc:creator>R Development Core Team</dc:creator>
    <dc:source>(2008)</dc:source>
    <dc:date>2008-04-17T15:27:51-00:00</dc:date>
    <prism:publicationYear>2008</prism:publicationYear>
    <prism:category>eecs435</prism:category>
    <prism:category>fse08</prism:category>
    <prism:category>issre07</prism:category>
    <prism:category>proposal</prism:category>
    <prism:category>tool</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2682512">
    <title>GCC, the GNU Compiler Collection</title>
    <link>http://www.citeulike.org/user/V/article/2682512</link>
    <description>&lt;i&gt;&lt;/i&gt;</description>
    <dc:title>GCC, the GNU Compiler Collection</dc:title>

    <dc:creator>GNU Project</dc:creator>
    <dc:date>2008-04-17T15:23:36-00:00</dc:date>
    <prism:category>dataset</prism:category>
    <prism:category>issre07</prism:category>
    <prism:category>proposal</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2682508">
    <title>Jacks Project</title>
    <link>http://www.citeulike.org/user/V/article/2682508</link>
    <description>&lt;i&gt;(2002)&lt;/i&gt;</description>
    <dc:title>Jacks Project</dc:title>

    <dc:creator>The Mauve Project</dc:creator>
    <dc:source>(2002)</dc:source>
    <dc:date>2008-04-17T15:21:30-00:00</dc:date>
    <prism:publicationYear>2002</prism:publicationYear>
    <prism:category>dataset</prism:category>
    <prism:category>fse08</prism:category>
    <prism:category>issre07</prism:category>
    <prism:category>java</prism:category>
    <prism:category>proposal</prism:category>
    <prism:category>testing</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2682339">
    <title>Java 2 Platform, Standard Edition 1.3</title>
    <link>http://www.citeulike.org/user/V/article/2682339</link>
    <description>&lt;i&gt;(1998-2000)&lt;/i&gt;</description>
    <dc:title>Java 2 Platform, Standard Edition 1.3</dc:title>

    <dc:source>(1998-2000)</dc:source>
    <dc:date>2008-04-17T15:15:28-00:00</dc:date>
    <prism:category>dataset</prism:category>
    <prism:category>fse08</prism:category>
    <prism:category>issre07</prism:category>
    <prism:category>java</prism:category>
    <prism:category>proposal</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2682323">
    <title>JTidy</title>
    <link>http://www.citeulike.org/user/V/article/2682323</link>
    <description>&lt;i&gt;(1998-2000)&lt;/i&gt;</description>
    <dc:title>JTidy</dc:title>

    <dc:source>(1998-2000)</dc:source>
    <dc:date>2008-04-17T15:12:59-00:00</dc:date>
    <prism:category>dataset</prism:category>
    <prism:category>fse08</prism:category>
    <prism:category>issre07</prism:category>
    <prism:category>java</prism:category>
    <prism:category>proposal</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2682305">
    <title>Estimation of software reliability by stratified sampling</title>
    <link>http://www.citeulike.org/user/V/article/2682305</link>
    <description>&lt;i&gt;ACM Trans. Softw. Eng. Methodol., Vol. 8, No. 3. (July 1999), pp. 263-283.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;A new approach to software reliability estimation is presented that combines operational testing with stratified sampling in order to reduce the number of program executions that must be checked manually for conformance to requirements. Automatic cluster analysis is applied to execution profiles in order to stratify captured operational executions. Experimental results are reported that suggest this approach can significantly reduce the cost of estimating reliability.</description>
    <dc:title>Estimation of software reliability by stratified sampling</dc:title>

    <dc:creator>Andy Podgurski</dc:creator>
    <dc:creator>Wassim Masri</dc:creator>
    <dc:creator>Yolanda Mccleese</dc:creator>
    <dc:creator>Francis Wolff</dc:creator>
    <dc:creator>Charles Yang</dc:creator>
    <dc:identifier>doi:10.1145/310663.310667</dc:identifier>
    <dc:source>ACM Trans. Softw. Eng. Methodol., Vol. 8, No. 3. (July 1999), pp. 263-283.</dc:source>
    <dc:date>2008-04-17T15:06:29-00:00</dc:date>
    <prism:publicationYear>1999</prism:publicationYear>
    <prism:publicationName>ACM Trans. Softw. Eng. Methodol.</prism:publicationName>
    <prism:volume>8</prism:volume>
    <prism:number>3</prism:number>
    <prism:startingPage>263</prism:startingPage>
    <prism:endingPage>283</prism:endingPage>
    <prism:publisher>ACM</prism:publisher>
    <prism:category>obt</prism:category>
    <prism:category>proposal</prism:category>
    <prism:category>reliability</prism:category>
    <prism:category>statistics</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2682285">
    <title>Selective capture and replay of program executions</title>
    <link>http://www.citeulike.org/user/V/article/2682285</link>
    <description>&lt;i&gt;(2005), pp. 1-7.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;In this paper, we present a technique for selective capture and replay of program executions. Given an application, the technique allows for (1) selecting a subsystem of interest, (2) capturing at runtime all the interactions between such subsystem and the rest of the application, and (3) replaying the recorded interactions on the subsystem in isolation. The technique can be used in several scenarios. For example, it can be used to generate test cases from users' executions, by capturing and collecting partial executions in the field. For another example. it can be used to perform expensive dynamic analyses off-line. For yet another example, it can be used to extract subsystem or unit tests from system tests. Our technique is designed to be efficient, in that we only capture information that is relevant to the considered execution. To this end, we disregard all data that, although flowing through the boundary of the subsystem of interest, do not affect the execution. In the paper, we also present a preliminary evaluation of the technique performed using SCARPE, a prototype tool that implements our approach.</description>
    <dc:title>Selective capture and replay of program executions</dc:title>

    <dc:creator>Alessandro Orso</dc:creator>
    <dc:creator>Bryan Kennedy</dc:creator>
    <dc:identifier>doi:10.1145/1083246.1083251</dc:identifier>
    <dc:source>(2005), pp. 1-7.</dc:source>
    <dc:date>2008-04-17T15:00:40-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:startingPage>1</prism:startingPage>
    <prism:endingPage>7</prism:endingPage>
    <prism:publisher>ACM</prism:publisher>
    <prism:category>obt</prism:category>
    <prism:category>profiling</prism:category>
    <prism:category>proposal</prism:category>
    <prism:category>testing</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2678768">
    <title>Economic perspectives in test automation: balancing automated and manual testing with opportunity cost</title>
    <link>http://www.citeulike.org/user/V/article/2678768</link>
    <description>&lt;i&gt;(2006), pp. 85-91.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Testing is a major cost factor in software development. Test automation has been proposed as one solution to reduce these costs. Test automation tools promise to increase the number of tests they run and the frequency at which they run them. So why not automate every test? In this paper we discuss the question &#34;When should a test be automated?&#34; and the trade-off between automated and manual testing. We reveal problems in the overly simplistic cost models commonly used to make decisions about automating testing. We introduce an alternative model based on opportunity cost and present influencing factors on the decision of whether or not to invest in test automation. Our aim is to stimulate discussion about these factors as well as their influence on the benefits and costs of automated testing in order to support researchers and practitioners reflecting on proposed automation approaches.</description>
    <dc:title>Economic perspectives in test automation: balancing automated and manual testing with opportunity cost</dc:title>

    <dc:creator>Rudolf Ramler</dc:creator>
    <dc:creator>Klaus Wolfmaier</dc:creator>
    <dc:identifier>doi:10.1145/1138929.1138946</dc:identifier>
    <dc:source>(2006), pp. 85-91.</dc:source>
    <dc:date>2008-04-16T19:14:11-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:startingPage>85</prism:startingPage>
    <prism:endingPage>91</prism:endingPage>
    <prism:publisher>ACM</prism:publisher>
    <prism:category>automation</prism:category>
    <prism:category>economics</prism:category>
    <prism:category>testing</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/745875">
    <title>Bug isolation via remote program sampling</title>
    <link>http://www.citeulike.org/user/V/article/745875</link>
    <description>&lt;i&gt;(2003), pp. 141-154.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We propose a low-overhead sampling infrastructure for gathering information from the executions experienced by a program's user community. Several example applications illustrate ways to use sampled instrumentation to isolate bugs. Assertion-dense code can be transformed to share the cost of assertions among many users. Lacking assertions, broad guesses can be made about predicates that predict program errors and a process of elimination used to whittle these down to the true bug. Finally, even for non-deterministic bugs such as memory corruption, statistical modeling based on logistic regression allows us to identify program behaviors that are strongly correlated with failure and are therefore likely places to look for the error.</description>
    <dc:title>Bug isolation via remote program sampling</dc:title>

    <dc:creator>Ben Liblit</dc:creator>
    <dc:creator>Alex Aiken</dc:creator>
    <dc:creator>Alice Zheng</dc:creator>
    <dc:creator>Michael Jordan</dc:creator>
    <dc:identifier>doi:10.1145/781131.781148</dc:identifier>
    <dc:source>(2003), pp. 141-154.</dc:source>
    <dc:date>2006-07-07T14:31:20-00:00</dc:date>
    <prism:publicationYear>2003</prism:publicationYear>
    <prism:issn>0362-1340</prism:issn>
    <prism:startingPage>141</prism:startingPage>
    <prism:endingPage>154</prism:endingPage>
    <prism:publisher>ACM Press</prism:publisher>
    <prism:category>proposal</prism:category>
    <prism:category>sw_engineering</prism:category>
    <prism:category>testing</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2679226">
    <title>Tree-based methods for classifying software failures</title>
    <link>http://www.citeulike.org/user/V/article/2679226</link>
    <description>&lt;i&gt;Software Reliability Engineering, 2004. ISSRE 2004. 15th International Symposium on (2004), pp. 451-462.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Recent research has addressed the problem of providing automated assistance to software developers in classifying reported instances of software failures so that failures with the same cause are grouped together. In this paper, two new tree-based techniques are presented for refining an initial classification of failures. One of these techniques is based on the use of dendrograms, which are rooted trees used to represent the results of hierarchical cluster analysis. The second technique employs a classification tree constructed to recognize failed executions. With both techniques, the tree representation is used to guide the refinement process. We also report the results of experimentally evaluating these techniques on several subject programs.</description>
    <dc:title>Tree-based methods for classifying software failures</dc:title>

    <dc:creator>P Francis</dc:creator>
    <dc:creator>D Leon</dc:creator>
    <dc:creator>M Minch</dc:creator>
    <dc:creator>A Podgurski</dc:creator>
    <dc:identifier>doi:10.1109/ISSRE.2004.43</dc:identifier>
    <dc:source>Software Reliability Engineering, 2004. ISSRE 2004. 15th International Symposium on (2004), pp. 451-462.</dc:source>
    <dc:date>2008-04-17T00:22:12-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:publicationName>Software Reliability Engineering, 2004. ISSRE 2004. 15th International Symposium on</prism:publicationName>
    <prism:startingPage>451</prism:startingPage>
    <prism:endingPage>462</prism:endingPage>
    <prism:category>obt</prism:category>
    <prism:category>proposal</prism:category>
    <prism:category>sw_engineering</prism:category>
    <prism:category>testing</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2679215">
    <title>A comparison of coverage-based and distribution-based techniques for filtering and prioritizing test cases</title>
    <link>http://www.citeulike.org/user/V/article/2679215</link>
    <description>&lt;i&gt;Software Reliability Engineering, 2003. ISSRE 2003. 14th International Symposium on (2003), pp. 442-453.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;This paper presents an empirical comparison of four different techniques for filtering large test suites: test suite minimization, prioritization by additional coverage, cluster filtering with one-per-cluster sampling, and failure pursuit sampling. The first two techniques are based on selecting subsets that maximize code coverage as quickly as possible, while the latter two are based on analyzing the distribution of the tests' execution profiles. These techniques were compared with data sets obtained from three large subject programs: the GCC, Jikes, and javac compilers. The results indicate that distribution-based techniques can be as efficient or more efficient for revealing defects than coverage-based techniques, but that the two kinds of techniques are also complementary in the sense that they find different defects. Accordingly, some simple combinations of these techniques were evaluated for use in test case prioritization. The results indicate that these techniques can create more efficient prioritizations than those generated using prioritization by additional coverage.</description>
    <dc:title>A comparison of coverage-based and distribution-based techniques for filtering and prioritizing test cases</dc:title>

    <dc:creator>D Leon</dc:creator>
    <dc:creator>A Podgurski</dc:creator>
    <dc:identifier>doi:10.1109/ISSRE.2003.1251065</dc:identifier>
    <dc:source>Software Reliability Engineering, 2003. ISSRE 2003. 14th International Symposium on (2003), pp. 442-453.</dc:source>
    <dc:date>2008-04-17T00:15:59-00:00</dc:date>
    <prism:publicationYear>2003</prism:publicationYear>
    <prism:publicationName>Software Reliability Engineering, 2003. ISSRE 2003. 14th International Symposium on</prism:publicationName>
    <prism:startingPage>442</prism:startingPage>
    <prism:endingPage>453</prism:endingPage>
    <prism:category>obt</prism:category>
    <prism:category>proposal</prism:category>
    <prism:category>sw_engineering</prism:category>
    <prism:category>testing</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2253110">
    <title>Detecting and debugging insecure information flows</title>
    <link>http://www.citeulike.org/user/V/article/2253110</link>
    <description>&lt;i&gt;Software Reliability Engineering, 2004. ISSRE 2004. 15th International Symposium on (2004), pp. 198-209.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;A new approach to dynamic information flow analysis is presented that can be used to detect and debug insecure flows in programs. It can be applied offline to validate and debug a program against an information flow policy, or, when fast response is not critical, it can be applied online to prevent illegal flows in deployed programs. Since dynamic analysis alone is inherently unable to detect implicit information flows, our approach incorporates a static preprocessing phase that permits detection of most implicit flows at runtime, in addition to explicit ones. To support interactive debugging of insecure flows, it also incorporates a new forward computing algorithm for dynamic slicing, which is more precise than previous forward computing algorithms and is not restricted to programs with structured control flow. A prototype tool implementing the proposed approach has been developed for Java byte code programs. Case studies in which this tool was applied to several subject programs are described.</description>
    <dc:title>Detecting and debugging insecure information flows</dc:title>

    <dc:creator>W Masri</dc:creator>
    <dc:creator>A Podgurski</dc:creator>
    <dc:creator>D Leon</dc:creator>
    <dc:identifier>doi:10.1109/ISSRE.2004.17</dc:identifier>
    <dc:source>Software Reliability Engineering, 2004. ISSRE 2004. 15th International Symposium on (2004), pp. 198-209.</dc:source>
    <dc:date>2008-01-18T19:41:50-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:publicationName>Software Reliability Engineering, 2004. ISSRE 2004. 15th International Symposium on</prism:publicationName>
    <prism:startingPage>198</prism:startingPage>
    <prism:endingPage>209</prism:endingPage>
    <prism:category>information_flow</prism:category>
    <prism:category>obt</prism:category>
    <prism:category>sw_engineering</prism:category>
    <prism:category>testing</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/259537">
    <title>Dex: a semantic-graph differencing tool for studying changes in large code bases</title>
    <link>http://www.citeulike.org/user/V/article/259537</link>
    <description>&lt;i&gt;Software Maintenance, 2004. Proceedings. 20th IEEE International Conference on (2004), pp. 188-197.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;This paper describes an automated tool called Dex (difference extractor) for analyzing syntactic and semantic changes in large C-language code bases. It is applied to patches obtained from a source code repository, each of which comprises the code changes made to accomplish a particular task. Dex produces summary statistics characterizing these changes for all of the patches that are analyzed. Dex applies a graph differencing algorithm to abstract semantic graphs (ASGs) representing each version. The differences are then analyzed to identify higher-level program changes. We describe the design of Dex, its potential applications, and the results of applying it to analyze bug fixes from the Apache and GCC projects. The results include detailed information about the nature and frequency of missing condition defects in these projects.</description>
    <dc:title>Dex: a semantic-graph differencing tool for studying changes in large code bases</dc:title>

    <dc:creator>S Raghavan</dc:creator>
    <dc:creator>R Rohana</dc:creator>
    <dc:creator>D Leon</dc:creator>
    <dc:creator>A Podgurski</dc:creator>
    <dc:creator>V Augustine</dc:creator>
    <dc:identifier>doi:10.1109/ICSM.2004.1357803</dc:identifier>
    <dc:source>Software Maintenance, 2004. Proceedings. 20th IEEE International Conference on (2004), pp. 188-197.</dc:source>
    <dc:date>2005-07-19T15:04:21-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:publicationName>Software Maintenance, 2004. Proceedings. 20th IEEE International Conference on</prism:publicationName>
    <prism:startingPage>188</prism:startingPage>
    <prism:endingPage>197</prism:endingPage>
    <prism:category>analysis</prism:category>
    <prism:category>graph_theory</prism:category>
    <prism:category>source</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2253101">
    <title>Multivariate visualization in observation-based testing</title>
    <link>http://www.citeulike.org/user/V/article/2253101</link>
    <description>&lt;i&gt;Software Engineering, 2000. Proceedings of the 2000 International Conference on (2000), pp. 116-125.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We explore the use of multivariate visualization techniques to support a new approach to test data selection, called observation-based testing. Applications of multivariate visualization are described, including: evaluating and improving synthetic tests; filtering regression test suites; filtering captured operational executions; comparing test suites; and assessing bug reports. These applications are illustrated by the use of correspondence analysis to analyze test inputs for the GNU GCC compiler</description>
    <dc:title>Multivariate visualization in observation-based testing</dc:title>

    <dc:creator>D Leon</dc:creator>
    <dc:creator>A Podgurski</dc:creator>
    <dc:creator>LJ White</dc:creator>
    <dc:identifier>doi:10.1109/ICSE.2000.870403</dc:identifier>
    <dc:source>Software Engineering, 2000. Proceedings of the 2000 International Conference on (2000), pp. 116-125.</dc:source>
    <dc:date>2008-01-18T19:40:13-00:00</dc:date>
    <prism:publicationYear>2000</prism:publicationYear>
    <prism:publicationName>Software Engineering, 2000. Proceedings of the 2000 International Conference on</prism:publicationName>
    <prism:startingPage>116</prism:startingPage>
    <prism:endingPage>125</prism:endingPage>
    <prism:category>obt</prism:category>
    <prism:category>sw_engineering</prism:category>
    <prism:category>testing</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2253086">
    <title>Pursuing failure: the distribution of program failures in a profile space</title>
    <link>http://www.citeulike.org/user/V/article/2253086</link>
    <description>&lt;i&gt;(2001), pp. 246-255.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Observation-based testing calls for analyzing profiles of executions induced by potential test cases, in order to select a subset of executions to be checked for conformance to requirements. A family of techniques for selecting such a subset is evaluated experimentally. These techniques employ automatic cluster analysis to partition executions, and they use various sampling techniques to select executions from clusters. The experimental results support the hypothesis that with appropriate profiling, failures often have unusual profiles that are revealed by cluster analysis. The results also suggest that failures often form small clusters or chains in sparsely-populated areas of the profile space. A form of adaptive sampling called failure-pursuit sampling is proposed for revealing failures in such regions, and this sampling method is evaluated experimentally. The results suggest that failure-pursuit sampling is effective.</description>
    <dc:title>Pursuing failure: the distribution of program failures in a profile space</dc:title>

    <dc:creator>William Dickinson</dc:creator>
    <dc:creator>David Leon</dc:creator>
    <dc:creator>Andy Podgurski</dc:creator>
    <dc:identifier>doi:10.1145/503209.503243</dc:identifier>
    <dc:source>(2001), pp. 246-255.</dc:source>
    <dc:date>2008-01-18T19:35:34-00:00</dc:date>
    <prism:publicationYear>2001</prism:publicationYear>
    <prism:startingPage>246</prism:startingPage>
    <prism:endingPage>255</prism:endingPage>
    <prism:publisher>ACM</prism:publisher>
    <prism:category>obt</prism:category>
    <prism:category>proposal</prism:category>
    <prism:category>sw_engineering</prism:category>
    <prism:category>testing</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2253083">
    <title>Automated support for classifying software failure reports</title>
    <link>http://www.citeulike.org/user/V/article/2253083</link>
    <description>&lt;i&gt;(2003), pp. 465-475.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;This paper proposes automated support for classifying reported software failures in order to facilitate prioritizing them and diagnosing their causes. A classification strategy is presented that involves the use of supervised and unsupervised pattern classification and multivariate visualization. These techniques are applied to profiles of failed executions in order to group together failures with the same or similar causes. The resulting classification is then used to assess the frequency and severity of failures caused by particular defects and to help diagnose those defects. The results of applying the proposed classification strategy to failures of three large subject programs are reported. These results indicate that the strategy can be effective.</description>
    <dc:title>Automated support for classifying software failure reports</dc:title>

    <dc:creator>Andy Podgurski</dc:creator>
    <dc:creator>David Leon</dc:creator>
    <dc:creator>Patrick Francis</dc:creator>
    <dc:creator>Wes Masri</dc:creator>
    <dc:creator>Melinda Minch</dc:creator>
    <dc:creator>Jiayang Sun</dc:creator>
    <dc:creator>Bin Wang</dc:creator>
    <dc:source>(2003), pp. 465-475.</dc:source>
    <dc:date>2008-01-18T19:34:36-00:00</dc:date>
    <prism:publicationYear>2003</prism:publicationYear>
    <prism:startingPage>465</prism:startingPage>
    <prism:endingPage>475</prism:endingPage>
    <prism:publisher>IEEE Computer Society</prism:publisher>
    <prism:category>obt</prism:category>
    <prism:category>proposal</prism:category>
    <prism:category>sw_engineering</prism:category>
    <prism:category>testing</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2253071">
    <title>Finding failures by cluster analysis of execution profiles</title>
    <link>http://www.citeulike.org/user/V/article/2253071</link>
    <description>&lt;i&gt;(2001), pp. 339-348.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;We experimentally evaluate the effectiveness of using cluster analysis of execution profiles to find failures among the executions induced by a set of potential test cases. We compare several filtering procedures for selecting executions to evaluate for conformance to requirements. Each filtering procedure involves a choice of a sampling strategy and a clustering metric. The results suggest that filtering procedures based on clustering are more effective than simple random sampling for identifying failures in populations of operational executions, with adaptive sampling from clusters being the most effective sampling strategy. The results also suggest that clustering metrics that give extra weight to unusual profile features are most effective. Scatter plots of execution populations, produced by multidimensional scaling, are used to provide intuition for these results.</description>
    <dc:title>Finding failures by cluster analysis of execution profiles</dc:title>

    <dc:creator>William Dickinson</dc:creator>
    <dc:creator>David Leon</dc:creator>
    <dc:creator>Andy Podgurski</dc:creator>
    <dc:source>(2001), pp. 339-348.</dc:source>
    <dc:date>2008-01-18T19:31:47-00:00</dc:date>
    <prism:publicationYear>2001</prism:publicationYear>
    <prism:startingPage>339</prism:startingPage>
    <prism:endingPage>348</prism:endingPage>
    <prism:publisher>IEEE Computer Society</prism:publisher>
    <prism:category>obt</prism:category>
    <prism:category>proposal</prism:category>
    <prism:category>sw_engineering</prism:category>
    <prism:category>testing</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2253067">
    <title>Corroborating User Assessments of Software Behavior to Facilitate Operational Testing</title>
    <link>http://www.citeulike.org/user/V/article/2253067</link>
    <description>&lt;i&gt;Software Reliability, 2007. ISSRE '07. The 18th IEEE International Symposium on (2007), pp. 61-70.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Operational or &#34;beta&#34; testing of software has a number of benefits for software vendors and has become common industry practice. However, ordinary users are more likely to overlook or misreport software problems than experienced software testers are. To compensate for this shortcoming, we present a technique called corroboration-based filtering for corroborating user assessments of individual operational executions for which audit information has been captured for possible offline review. Independent assessments concerning similar executions are pooled by automatically clustering together executions with similar execution profiles. Executions are chosen for review based on their user assessments, the size of the cluster each execution belongs to, and whether the cluster has already been confirmed by developers to contain an actual failure. We explain the rationale for this technique, analyze it probabilistically, and present the results of empirically comparing it to alternative techniques.</description>
    <dc:title>Corroborating User Assessments of Software Behavior to Facilitate Operational Testing</dc:title>

    <dc:creator>Vinay Augustine</dc:creator>
    <dc:creator>Andy Podgurski</dc:creator>
    <dc:identifier>doi:10.1109/ISSRE.2007.7</dc:identifier>
    <dc:source>Software Reliability, 2007. ISSRE '07. The 18th IEEE International Symposium on (2007), pp. 61-70.</dc:source>
    <dc:date>2008-01-18T19:29:43-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:publicationName>Software Reliability, 2007. ISSRE '07. The 18th IEEE International Symposium on</prism:publicationName>
    <prism:startingPage>61</prism:startingPage>
    <prism:endingPage>70</prism:endingPage>
    <prism:category>corroboration</prism:category>
    <prism:category>eecs435</prism:category>
    <prism:category>proposal</prism:category>
    <prism:category>sw_engineering</prism:category>
    <prism:category>testing</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2204598">
    <title>Helping users avoid bugs in GUI applications</title>
    <link>http://www.citeulike.org/user/V/article/2204598</link>
    <description>&lt;i&gt;(2005), pp. 107-116.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;In this paper, we propose a method to help users avoid bugs in GUI applications. In particular, users would use the application normally and report bugs that they encounter to prevent anyone -- including themselves -- from encountering those bugs again. When a user attempts an action that has led to problems in the past, he/she will receive a warning and will be given the opportunity to abort the action -- thus avoiding the bug altogether and keeping the application stable. Of course, bugs should be fixed eventually by the application developers, but our approach allows application users to collaboratively help each other avoid bugs -- thus making the application more usable in the meantime. We demonstrate this approach using our &#34;Stabilizer&#34; prototype. We also include a preliminary evaluation of the Stabilizer's bug prediction.</description>
    <dc:title>Helping users avoid bugs in GUI applications</dc:title>

    <dc:creator>Amir Michail</dc:creator>
    <dc:creator>Tao Xie</dc:creator>
    <dc:source>(2005), pp. 107-116.</dc:source>
    <dc:date>2008-01-07T18:35:21-00:00</dc:date>
    <prism:publicationYear>2005</prism:publicationYear>
    <prism:startingPage>107</prism:startingPage>
    <prism:endingPage>116</prism:endingPage>
    <prism:publisher>ACM</prism:publisher>
    <prism:category>proposal</prism:category>
    <prism:category>sw_engineering</prism:category>
    <prism:category>testing</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2204587">
    <title>Pruning dynamic slices with confidence</title>
    <link>http://www.citeulike.org/user/V/article/2204587</link>
    <description>&lt;i&gt;(2006), pp. 169-180.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;Given an incorrect value produced during a failed program run (e.g., a wrong output value or a value that causes the program to crash), the backward dynamic slice of the value very frequently captures the faulty code responsible for producing the incorrect value. Although the dynamic slice often contains only a small percentage of the statements executed during the failed program run, the dynamic slice can still be large and thus considerable effort may be required by the programmer to locate the faulty code.In this paper we develop a strategy for pruning the dynamic slice to identify a subset of statements in the dynamic slice that are likely responsible for producing the incorrect value. We observe that some of the statements used in computing the incorrect value may also have been involved in computing correct values (e.g., a value produced by a statement in the dynamic slice of the incorrect value may also have been used in computing a correct output value prior to the incorrect value). For each such executed statement in the dynamic slice, using the value profiles of the executed statements, we compute a confidence value ranging from 0 to 1 - a higher confidence value corresponds to greater likelihood that the execution of the statement produced a correct value. Given a failed run involving execution of a single error, we demonstrate that the pruning of a dynamic slice by excluding only the statements with the confidence value of 1 is highly effective in reducing the size of the dynamic slice while retaining the faulty code in the slice. Our experiments show that the number of distinct statements in a pruned dynamic slice are 1.79 to 190.57 times less than the full dynamic slice. Confidence values also prioritize the statements in the dynamic slice according to the likelihood of them being faulty. We show that examining the statements in the order of increasing confidence values is an effective strategy for reducing the effort of fault location.</description>
    <dc:title>Pruning dynamic slices with confidence</dc:title>

    <dc:creator>Xiangyu Zhang</dc:creator>
    <dc:creator>Neelam Gupta</dc:creator>
    <dc:creator>Rajiv Gupta</dc:creator>
    <dc:source>(2006), pp. 169-180.</dc:source>
    <dc:date>2008-01-07T18:27:30-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:issn>0362-1340</prism:issn>
    <prism:startingPage>169</prism:startingPage>
    <prism:endingPage>180</prism:endingPage>
    <prism:publisher>ACM</prism:publisher>
    <prism:category>information_flow</prism:category>
    <prism:category>slicing</prism:category>
    <prism:category>toread</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2204567">
    <title>An empirical comparison between direct and indirect test result checking approaches</title>
    <link>http://www.citeulike.org/user/V/article/2204567</link>
    <description>&lt;i&gt;(2006), pp. 6-13.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;An oracle in software testing is a mechanism for checking whether the system under test has behaved correctly for any executions. In some situations, oracles are unavailable or too expensive to apply. This is known as the oracle problem. It is crucial to develop techniques to address it, and metamorphic testing (MT) was one of such proposals. This paper conducts a controlled experiment to investigate the cost effectiveness of using MT by 38 testers on three open-source programs. The fault detection capability and time cost of MT are compared with the popular assertion checking method. Our results show that MT is cost-efﬁcient and has potentials for detecting more faults than the assertion checking method.</description>
    <dc:title>An empirical comparison between direct and indirect test result checking approaches</dc:title>

    <dc:creator>Peifeng Hu</dc:creator>
    <dc:creator>Zhenyu Zhang</dc:creator>
    <dc:creator>WK Chan</dc:creator>
    <dc:creator>TH Tse</dc:creator>
    <dc:source>(2006), pp. 6-13.</dc:source>
    <dc:date>2008-01-07T18:19:47-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:startingPage>6</prism:startingPage>
    <prism:endingPage>13</prism:endingPage>
    <prism:publisher>ACM</prism:publisher>
    <prism:category>sw_engineering</prism:category>
    <prism:category>testing</prism:category>
    <prism:category>toread</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/329575">
    <title>Subspace clustering for high dimensional data: a review</title>
    <link>http://www.citeulike.org/user/V/article/329575</link>
    <description>&lt;i&gt;SIGKDD Explor. Newsl., Vol. 6, No. 1. (June 2004), pp. 90-105.&lt;/i&gt;</description>
    <dc:title>Subspace clustering for high dimensional data: a review</dc:title>

    <dc:creator>Lance Parsons</dc:creator>
    <dc:creator>Ehtesham Haque</dc:creator>
    <dc:creator>Huan Liu</dc:creator>
    <dc:identifier>doi:10.1145/1007730.1007731</dc:identifier>
    <dc:source>SIGKDD Explor. Newsl., Vol. 6, No. 1. (June 2004), pp. 90-105.</dc:source>
    <dc:date>2005-09-22T04:58:48-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:publicationName>SIGKDD Explor. Newsl.</prism:publicationName>
    <prism:volume>6</prism:volume>
    <prism:number>1</prism:number>
    <prism:startingPage>90</prism:startingPage>
    <prism:endingPage>105</prism:endingPage>
    <prism:publisher>ACM Press</prism:publisher>
    <prism:category>algorithms</prism:category>
    <prism:category>classification</prism:category>
    <prism:category>data_mining</prism:category>
    <prism:category>high_dimensional_space</prism:category>
    <prism:category>survey</prism:category>
    <prism:category>toread</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/2057345">
    <title>Automating Software Failure Reporting: We can only fix those bugs we know about.</title>
    <link>http://www.citeulike.org/user/V/article/2057345</link>
    <description>&lt;i&gt;ACM Queue, Vol. 2, No. 8. (November 2004)&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;There are many ways to measure quality before and after software is released. For commercial and internal-use-only products, the most important measurement is the user’s perception of product quality. Unfortunately, perception is difficult to measure, so companies attempt to quantify it through customer satisfaction surveys and failure/behavioral data collected from its customer base. This article focuses on the problems of capturing failure data from customer sites. To explore the pertinent issues I rely on experience gained from collecting failure data from Windows XP systems, but the problems you are likely to face when developing internal (noncommercial) software should not be dissimilar.</description>
    <dc:title>Automating Software Failure Reporting: We can only fix those bugs we know about.</dc:title>

    <dc:creator>B Murphy</dc:creator>
    <dc:source>ACM Queue, Vol. 2, No. 8. (November 2004)</dc:source>
    <dc:date>2007-12-04T15:17:16-00:00</dc:date>
    <prism:publicationYear>2004</prism:publicationYear>
    <prism:publicationName>ACM Queue</prism:publicationName>
    <prism:volume>2</prism:volume>
    <prism:number>8</prism:number>
    <prism:category>beta_testing</prism:category>
    <prism:category>obt</prism:category>
    <prism:category>statistics</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/1559292">
    <title>Heuristic ranking of java program edits for fault localization</title>
    <link>http://www.citeulike.org/user/V/article/1559292</link>
    <description>&lt;i&gt;(2007), pp. 239-249.&lt;/i&gt;</description>
    <dc:title>Heuristic ranking of java program edits for fault localization</dc:title>

    <dc:creator>Xiaoxia Ren</dc:creator>
    <dc:creator>Barbara Ryder</dc:creator>
    <dc:identifier>doi:10.1145/1273463.1273495</dc:identifier>
    <dc:source>(2007), pp. 239-249.</dc:source>
    <dc:date>2007-08-14T01:47:51-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:startingPage>239</prism:startingPage>
    <prism:endingPage>249</prism:endingPage>
    <prism:publisher>ACM Press</prism:publisher>
    <prism:category>fault_localization</prism:category>
    <prism:category>toread</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/1559288">
    <title>Techniques for Classifying Executions of Deployed Software to Support Software Engineering Tasks</title>
    <link>http://www.citeulike.org/user/V/article/1559288</link>
    <description>&lt;i&gt;Software Engineering, IEEE Transactions on, Vol. 33, No. 5. (2007), pp. 287-304.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;There is an increasing interest in techniques that support analysis and measurement of fielded software systems. These techniques typically deploy numerous instrumented instances of a software system, collect execution data when the instances run in the field, and analyze the remotely collected data to better understand the system's in-the-field behavior. One common need for these techniques is the ability to distinguish execution outcomes (e.g., to collect only data corresponding to some behavior or to determine how often and under which condition a specific behavior occurs). Most current approaches, however, do not perform any kind of classification of remote executions and either focus on easily observable behaviors (e.g., crashes) or assume that outcomes' classifications are externally provided (e.g., by the users). To address the limitations of existing approaches, we have developed three techniques for automatically classifying execution data as belonging to one of several classes. In this paper, we introduce our techniques and apply them to the binary classification of passing and failing behaviors. Our three techniques impose different overheads on program instances and, thus, each is appropriate for different application scenarios. We performed several empirical studies to evaluate and refine our techniques and to investigate the trade-offs among them. Our results show that 1) the first technique can build very accurate models, but requires a complete set of execution data; 2) the second technique produces slightly less accurate models, but needs only a small fraction of the total execution data; and 3) the third technique allows for even further cost reductions by building the models incrementally, but requires some sequential ordering of the software instances' instrumentation.</description>
    <dc:title>Techniques for Classifying Executions of Deployed Software to Support Software Engineering Tasks</dc:title>

    <dc:creator>Murali Haran</dc:creator>
    <dc:creator>Alan Karr</dc:creator>
    <dc:creator>Michael Last</dc:creator>
    <dc:creator>Alessandro Orso</dc:creator>
    <dc:creator>Porter</dc:creator>
    <dc:creator>Ashish Sanil</dc:creator>
    <dc:creator>Sandro Fouche</dc:creator>
    <dc:source>Software Engineering, IEEE Transactions on, Vol. 33, No. 5. (2007), pp. 287-304.</dc:source>
    <dc:date>2007-08-14T01:43:11-00:00</dc:date>
    <prism:publicationYear>2007</prism:publicationYear>
    <prism:publicationName>Software Engineering, IEEE Transactions on</prism:publicationName>
    <prism:volume>33</prism:volume>
    <prism:number>5</prism:number>
    <prism:startingPage>287</prism:startingPage>
    <prism:endingPage>304</prism:endingPage>
    <prism:category>beta_testing</prism:category>
    <prism:category>classification</prism:category>
    <prism:category>sw_engineering</prism:category>
</item>



<item rdf:about="http://www.citeulike.org/user/V/article/1559277">
    <title>Geometric Basis of Semi-supervised Learning</title>
    <link>http://www.citeulike.org/user/V/article/1559277</link>
    <description>&lt;i&gt;(2006), pp. 209-226.&lt;/i&gt;&lt;br /&gt;&lt;br /&gt;In this chapter, we present an algorithmic framework for semi-supervised inference based on geometric properties of probability distributions. Our approach brings together Laplacian-based spectral techniques, regularization with kernel methods, and algorithms for manifold learning. This framework provides a natural semi-supervised extension for kernel methods and resolves the problem of out-of-sample inference in graph-based transduction. We discuss an interpretation in terms of a family of globally defined data-dependent kernels and also address unsupervised learning (clustering and data representation) within the same framework. Our algorithms effectively exploit both manifold and cluster assumptions to demonstrate state-of-the-art performance on various classification tasks. This chapter also reviews other recent work on out-of-sample extension for transductive graph-based methods.</description>
    <dc:title>Geometric Basis of Semi-supervised Learning</dc:title>

    <dc:creator>Vikas Sindhwani</dc:creator>
    <dc:creator>Misha Belkin</dc:creator>
    <dc:creator>Partha Niyogi</dc:creator>
    <dc:source>(2006), pp. 209-226.</dc:source>
    <dc:date>2007-08-14T01:35:36-00:00</dc:date>
    <prism:publicationYear>2006</prism:publicationYear>
    <prism:startingPage>209</prism:startingPage>
    <prism:endingPage>226</prism:endingPage>
    <prism:publisher>MIT Press</prism:publisher>
    <prism:category>semi-supervised_learning</prism:category>
</item>



</rdf:RDF>

