@inproceedings{sun-etal-2021-parallel,
title = "Parallel sentences mining with transfer learning in an unsupervised setting",
author = "Sun, Yu and
Zhu, Shaolin and
Feng, Yifan and
Mi, Chenggang",
editor = "Durmus, Esin and
Gupta, Vivek and
Liu, Nelson and
Peng, Nanyun and
Su, Yu",
booktitle = "Proceedings of the 2021 Conference of the North American Chapter of the Association for Computational Linguistics: Student Research Workshop",
month = jun,
year = "2021",
address = "Online",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/add-emnlp-2024-awards/2021.naacl-srw.17/",
doi = "10.18653/v1/2021.naacl-srw.17",
pages = "136--142",
abstract = "The quality and quantity of parallel sentences are known to be very important training data for constructing neural machine translation (NMT) systems. However, these resources are not available for many low-resource language pairs. Many existing methods require strong supervision and are therefore not suitable. Although there have been several attempts at developing unsupervised models, they ignore the language-invariant information shared between languages. In this paper, we propose an approach based on transfer learning to mine parallel sentences in the unsupervised setting. With the help of bilingual corpora of rich-resource language pairs, we can mine parallel sentences without bilingual supervision of low-resource language pairs. Experiments show that our approach improves the quality of mined parallel sentences compared with previous methods. In particular, we achieve excellent results on two real-world low-resource language pairs."
}