% Mousavi et al., GEM workshop paper (2022). The url field uses the canonical
% ACL Anthology address instead of a temporary preview-branch deployment.
@inproceedings{mousavi-etal-2022-evaluation,
  author    = {Mousavi, Seyed Mahed and
               Roccabruna, Gabriel and
               Lorandi, Michela and
               Caldarella, Simone and
               Riccardi, Giuseppe},
  title     = {Evaluation of Response Generation Models: Shouldn't It Be Shareable and Replicable?},
  editor    = {Bosselut, Antoine and
               Chandu, Khyathi and
               Dhole, Kaustubh and
               Gangal, Varun and
               Gehrmann, Sebastian and
               Jernite, Yacine and
               Novikova, Jekaterina and
               Perez-Beltrachini, Laura},
  booktitle = {Proceedings of the 2nd Workshop on Natural Language Generation, Evaluation, and Metrics ({GEM})},
  month     = dec,
  year      = {2022},
  address   = {Abu Dhabi, United Arab Emirates (Hybrid)},
  publisher = {Association for Computational Linguistics},
  pages     = {136--147},
  doi       = {10.18653/v1/2022.gem-1.12},
  url       = {https://aclanthology.org/2022.gem-1.12/},
}