@comment{
  Workshop paper record (inproceedings) in ACL Anthology export style.
  The address field holds the location as given by the export; the month
  field uses the standard three-letter macro and must remain unquoted.
}
@inproceedings{rognan-beekhuizen-2025-discovery,
    title     = "A discovery procedure for synlexification patterns in the world{'}s languages",
    author    = "Rognan, Hannah S.  and
                 Beekhuizen, Barend",
    editor    = "Hahn, Michael  and
                 Rani, Priya  and
                 Kumar, Ritesh  and
                 Shcherbakov, Andreas  and
                 Sorokin, Alexey  and
                 Serikov, Oleg  and
                 Cotterell, Ryan  and
                 Vylomova, Ekaterina",
    booktitle = "Proceedings of the 7th Workshop on Research in Computational Linguistic Typology and Multilingual NLP",
    month     = aug,
    year      = "2025",
    address   = "Vienna, Austria",
    publisher = "Association for Computational Linguistics",
    url       = "https://preview.aclanthology.org/landing_page/2025.sigtyp-1.12/",
    pages     = "93--113",
    isbn      = "979-8-89176-281-7",
    abstract  = "Synlexification is the pattern of crosslinguistic lexical semantic variation whereby what is expressed in a single word in one language, is expressed in multiple words in another (e.g., French `monter' vs. English `go+up'). We introduce a computational method for automatically extracting instances of synlexification from a parallel corpus at a large scale (many languages, many domains). The method involves debiasing the seed language by splitting up synlexifications in the seed language where other languages consistently split them. The method was applied to a massively parallel corpus of 198 Bible translations. We validate it on a broad sample of cases, and demonstrate its potential for typological research."
}
Markdown (Informal)
[A discovery procedure for synlexification patterns in the world’s languages](https://preview.aclanthology.org/landing_page/2025.sigtyp-1.12/) (Rognan & Beekhuizen, SIGTYP 2025)
ACL