% COLING 2025 main-conference paper (ACL Anthology ID 2025.coling-main.512).
% Names use the unambiguous "Last, First" form; the compound surname
% "Di Eugenio" is kept together so it sorts and abbreviates correctly.
% NOTE(review): the url points at a preview.aclanthology.org branch, which
% looks like a staging link -- confirm and switch to the canonical address.
@inproceedings{chousa-hirao-2025-automatic,
  title     = {Automatic Evaluation of Language Generation Technology Based on Structure Alignment},
  author    = {Chousa, Katsuki and
               Hirao, Tsutomu},
  editor    = {Rambow, Owen and
               Wanner, Leo and
               Apidianaki, Marianna and
               Al-Khalifa, Hend and
               Di Eugenio, Barbara and
               Schockaert, Steven},
  booktitle = {Proceedings of the 31st International Conference on Computational Linguistics},
  month     = jan,
  year      = {2025},
  address   = {Abu Dhabi, UAE},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/jlcl-multiple-ingestion/2025.coling-main.512/},
  pages     = {7663--7670},
  abstract  = {Language generation techniques require automatic evaluation to carry out efficient and reproducible experiments. While n-gram matching is standard, it fails to capture semantic equivalence with different wording. Recent methods have addressed this issue by using contextual embeddings from pre-trained language models to compute the similarity between reference and hypothesis. However, these methods frequently disregard the syntax of sentences, despite its crucial role in determining meaning, and thus assign unjustifiably high scores. This paper proposes an automatic evaluation metric that considers both the words in sentences and their syntactic structures. We integrate syntactic information into the recent embedding-based approach. Experimental results obtained from two NLP tasks show that our method is at least comparable to standard baselines.},
}
Markdown (Informal)
[Automatic Evaluation of Language Generation Technology Based on Structure Alignment](https://preview.aclanthology.org/jlcl-multiple-ingestion/2025.coling-main.512/) (Chousa & Hirao, COLING 2025)
ACL