% Workshop paper from the MWE 2026 proceedings. The url field points at an
% ACL Anthology preview build; the abstract is kept verbatim as exported.
@inproceedings{cavusoglu-coltekin-2026-idiom,
  title     = {An Idiom Benchmark for {Turkish}},
  author    = {{\c{C}}avu{\c{s}}o{\u{g}}lu, Ebru and
               Coltekin, Cagri},
  editor    = {Ojha, Atul Kr. and
               Mititelu, Verginica Barbu and
               Constant, Mathieu and
               Stoyanova, Ivelina and
               Do{\u{g}}ru{\"o}z, A. Seza and
               Rademaker, Alexandre},
  booktitle = {Proceedings of the 22nd Workshop on Multiword Expressions ({MWE} 2026)},
  month     = mar,
  year      = {2026},
  address   = {Rabat, Morocco},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-eacl/2026.mwe-1.12/},
  pages     = {103--109},
  isbn      = {979-8-89176-363-0},
  abstract  = {Despite recent significant advances, idioms, like other forms of figurative language, present a challenge to natural language processing (NLP). Benchmark corpora are essential for improving the current models on understanding idioms. However, such corpora are only available for a limited set of languages. In this paper, we introduce our ongoing work on a benchmark corpus of Turkish idioms. Our corpus is structured for testing both idiom recognition and idiom understanding. The corpus is currently consists of 200 instances with sentences including idiomatic use, their literal paraphrases, similar sentences with no entailment, and non-idiomatic use of the idiomatic expressions when possible. We describe the methodology used to create the corpus, as well as initial experiments with a selection of LLMs.},
}

Markdown (Informal)
[An Idiom Benchmark for Turkish](https://preview.aclanthology.org/ingest-eacl/2026.mwe-1.12/) (Çavuşoğlu & Coltekin, MWE 2026)
ACL
- Ebru Çavuşoğlu and Cagri Coltekin. 2026. An Idiom Benchmark for Turkish. In Proceedings of the 22nd Workshop on Multiword Expressions (MWE 2026), pages 103–109, Rabat, Morocco. Association for Computational Linguistics.