% LREC 2010 conference paper presenting REVISE, a glass-box diagnostic
% evaluation tool for question answering systems.
% The year abbreviation in booktitle uses an apostrophe ('10), not a backtick,
% so that LaTeX typesets a closing quote rather than an opening one.
% NOTE(review): the first author's surname may be the compound "El Ayari";
% confirm with the publication before changing the name split below.
@inproceedings{ayari-etal-2010-fine,
    title     = {Fine-grained Linguistic Evaluation of Question Answering Systems},
    author    = {Ayari, Sarra El and
                 Grau, Brigitte and
                 Ligozat, Anne-Laure},
    editor    = {Calzolari, Nicoletta and
                 Choukri, Khalid and
                 Maegaard, Bente and
                 Mariani, Joseph and
                 Odijk, Jan and
                 Piperidis, Stelios and
                 Rosner, Mike and
                 Tapias, Daniel},
    booktitle = {Proceedings of the Seventh International Conference on Language Resources and Evaluation ({LREC}'10)},
    month     = may,
    year      = {2010},
    address   = {Valletta, Malta},
    publisher = {European Language Resources Association (ELRA)},
    url       = {https://aclanthology.org/L10-1359/},
    abstract  = {Question answering systems are complex systems using natural language processing. Some evaluation campaigns are organized to evaluate such systems in order to propose a classification of systems based on final results (number of correct answers). Nevertheless, teams need to evaluate more precisely the results obtained by their systems if they want to do a diagnostic evaluation. There are no tools or methods to do these evaluations systematically. We present REVISE, a tool for glass box evaluation based on diagnostic of question answering system results.},
}
Markdown (Informal)
[Fine-grained Linguistic Evaluation of Question Answering Systems](https://aclanthology.org/L10-1359/) (Ayari et al., LREC 2010)
ACL