% Conference paper (Image Analysis and Recognition, 2014; Springer vol. 8814), exported from refbase record 2559.
% The two former "optnote" fields are kept apart: group tags stay in "optnote", export provenance is in "optexportnote".
@InProceedings{FrancescoBrughi2014,
  author        = "Francesco Brughi and Debora Gil and Lloren{\c{c}} Badiella and Eva Jove Casabella and Oriol Ramos Terrades",
  title         = "Exploring the impact of inter-query variability on the performance of retrieval systems",
  booktitle     = "11th International Conference on Image Analysis and Recognition",
  series        = "Lecture Notes in Computer Science",
  volume        = "8814",
  pages         = "413--420",
  publisher     = "Springer International Publishing",
  year          = "2014",
  isbn          = "978-3-319-11757-7",
  issn          = "0302-9743",
  doi           = "10.1007/978-3-319-11758-4_45",
  file          = ":http://refbase.cvc.uab.es/files/BGB2014.pdf:PDF",
  abstract      = "This paper introduces a framework for evaluating the performance of information retrieval systems. Current evaluation metrics provide an average score that does not consider performance variability across the query set. In this manner, conclusions lack of any statistical significance, yielding poor inference to cases outside the query set and possibly unfair comparisons. We propose to apply statistical methods in order to obtain a more informative measure for problems in which different query classes can be identified. In this context, we assess the performance variability on two levels: overall variability across the whole query set and specific query class-related variability. To this end, we estimate confidence bands for precision-recall curves, and we apply ANOVA in order to assess the significance of the performance across different query classes.",
  optnote       = "IAM; DAG; 600.060; 600.061; 600.077; 600.075",
  optexportnote = "exported from refbase (http://refbase.cvc.uab.es/show.php?record=2559), last updated on Thu, 10 Nov 2016 12:21:18 +0100",
}