@inproceedings{zhang-etal-2016-inducing,
title = "Inducing Bilingual Lexica From Non-Parallel Data With Earth Mover`s Distance Regularization",
author = "Zhang, Meng and
Liu, Yang and
Luan, Huanbo and
Liu, Yiqun and
Sun, Maosong",
editor = "Matsumoto, Yuji and
Prasad, Rashmi",
booktitle = "Proceedings of {COLING} 2016, the 26th International Conference on Computational Linguistics: Technical Papers",
month = dec,
year = "2016",
address = "Osaka, Japan",
publisher = "The COLING 2016 Organizing Committee",
url = "https://preview.aclanthology.org/jlcl-multiple-ingestion/C16-1300/",
pages = "3188--3198",
abstract = "Being able to induce word translations from non-parallel data is often a prerequisite for cross-lingual processing in resource-scarce languages and domains. Previous endeavors typically simplify this task by imposing the one-to-one translation assumption, which is too strong to hold for natural languages. We remove this constraint by introducing the Earth Mover`s Distance into the training of bilingual word embeddings. In this way, we take advantage of its capability to handle multiple alternative word translations in a natural form of regularization. Our approach shows significant and consistent improvements across four language pairs. We also demonstrate that our approach is particularly preferable in resource-scarce settings as it only requires a minimal seed lexicon."
}
Markdown (Informal)
[Inducing Bilingual Lexica From Non-Parallel Data With Earth Mover’s Distance Regularization](https://preview.aclanthology.org/jlcl-multiple-ingestion/C16-1300/) (Zhang et al., COLING 2016)
ACL