% Conference paper in the *SEM 2024 proceedings (ACL Anthology ID 2024.starsem-1.32).
% The url field uses the canonical aclanthology.org address, not a preview build.
@inproceedings{ki-etal-2024-inspecting,
  title     = {Inspecting Soundness of {AMR} Similarity Metrics in terms of Equivalence and Inequivalence},
  author    = {Ki, Kyung Seo and
               Kim, Bugeun and
               Gweon, Gahgene},
  editor    = {Bollegala, Danushka and
               Shwartz, Vered},
  booktitle = {Proceedings of the 13th Joint Conference on Lexical and Computational Semantics (*SEM 2024)},
  month     = jun,
  year      = {2024},
  address   = {Mexico City, Mexico},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2024.starsem-1.32/},
  doi       = {10.18653/v1/2024.starsem-1.32},
  pages     = {402--409},
  abstract  = {In this study, we investigate soundness of current Abstract Meaning Representation (AMR) similarity metrics in terms of equivalence and inequivalence. Specifically, AMR guidelines provide several equivalence and inequivalence conditions to reflect the meaning aspect of the semantics. Thus, it is important to examine an AMR metric's soundness, i.e., whether the metric correctly reflects the guidelines. However, the existing metrics have less investigated their soundness. In this work, we propose a new experimental method using simulated data and a series of statistical tests to verify the metric's soundness. Our experimental result revealed that all existing metrics such as Smatch, SemBLEU, S2match, Smatch++, WWLK-theta, WWLK-k3e2n, and SEMA did not fully meet the AMR guidelines in terms of equivalence and inequivalence aspects. Also, to alleviate this soundness problem, we suggest a revised metric called Smatch{\#}, which adopts simple graph standardization technique that can improve the soundness of an existing metric.},
}
Markdown (Informal)
[Inspecting Soundness of AMR Similarity Metrics in terms of Equivalence and Inequivalence](https://aclanthology.org/2024.starsem-1.32/) (Ki et al., \*SEM 2024)
ACL