@comment{Workshop paper record (inproceedings) for "Evaluation Cards for XAI Metrics".
  NOTE(review): the url field points at a preview.aclanthology.org ingest branch;
  confirm whether a canonical URL should replace it before relying on this entry.}
@inproceedings{gipiskis-kurasova-2026-evaluation,
  title     = {Evaluation Cards for {XAI} Metrics},
  author    = {Gipi{\v{s}}kis, Rokas and
               Kurasova, Olga},
  editor    = {Akhtar, Mubashara and
               Batzner, Jan and
               Choshen, Leshem and
               Ghosh, Avijit and
               Gohar, Usman and
               Mickel, Jennifer and
               Pant, Ichhya and
               Talat, Zeerak and
               Lin, Michelle},
  booktitle = {Proceedings of the Workshop on Evaluating Evaluations ({EvalEval})},
  month     = jul,
  year      = {2026},
  address   = {San Diego, CA},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-acl-workshops/2026.evaleval-1.39/},
  pages     = {245--251},
  isbn      = {979-8-89176-429-3},
  abstract  = {The evaluation of explainable AI (XAI) methods is affected by a lack of standardization. Metrics are inconsistently defined, incompletely reported, and rarely validated against common baselines. In this paper, we identify transparency of evaluation reporting as a central, under-addressed problem. We propose the XAI Evaluation Card, a documentation template analogous to model cards, designed to accompany any study that introduces an XAI evaluation metric. The card covers explicit declaration of target properties, grounding levels, metric assumptions, validation evidence, gaming risks, and known failure cases. We argue that adopting this template as a community norm would reduce evaluation fragmentation, support meta-analysis, and improve accountability in XAI research.},
}
Markdown (Informal)
[Evaluation Cards for XAI Metrics](https://preview.aclanthology.org/ingest-acl-workshops/2026.evaleval-1.39/) (Gipiškis & Kurasova, EvalEval 2026)
ACL
- Rokas Gipiškis and Olga Kurasova. 2026. Evaluation Cards for XAI Metrics. In Proceedings of the Workshop on Evaluating Evaluations (EvalEval), pages 245–251, San Diego, CA. Association for Computational Linguistics.