% Paper in the Fourth BlackboxNLP Workshop proceedings (2021), ACL Anthology ID 2021.blackboxnlp-1.1.
% The url field holds the canonical Anthology permalink; the doi field holds the bare DOI.
@inproceedings{prasad-etal-2021-extent,
  author    = {Prasad, Grusha and Nie, Yixin and Bansal, Mohit and Jia, Robin and Kiela, Douwe and Williams, Adina},
  title     = {To what extent do human explanations of model behavior align with actual model behavior?},
  editor    = {Bastings, Jasmijn and Belinkov, Yonatan and Dupoux, Emmanuel and Giulianelli, Mario and Hupkes, Dieuwke and Pinter, Yuval and Sajjad, Hassan},
  booktitle = {Proceedings of the Fourth {BlackboxNLP} Workshop on Analyzing and Interpreting Neural Networks for {NLP}},
  month     = nov,
  year      = {2021},
  address   = {Punta Cana, Dominican Republic},
  publisher = {Association for Computational Linguistics},
  pages     = {1--14},
  doi       = {10.18653/v1/2021.blackboxnlp-1.1},
  url       = {https://aclanthology.org/2021.blackboxnlp-1.1/},
}