@inproceedings{hamada-etal-2025-akibanlp,
title = "{A}kiba{NLP}-{TUT}: Injecting Language-Specific Word-Level Noise for Low-Resource Language Translation",
author = "Hamada, Shoki and
Akiba, Tomoyosi and
Tsukada, Hajime",
editor = "Haddow, Barry and
Kocmi, Tom and
Koehn, Philipp and
Monz, Christof",
booktitle = "Proceedings of the Tenth Conference on Machine Translation",
month = nov,
year = "2025",
address = "Suzhou, China",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/name-variant-enfa-fane/2025.wmt-1.104/",
doi = "10.18653/v1/2025.wmt-1.104",
pages = "1259--1264",
ISBN = "979-8-89176-341-8",
abstract = "In this paper, we describes our system for the WMT 2025 Low-Resource Indic Language Translation Shared Task.The language directions addressed are Assamese{\ensuremath{\leftrightarrow}}English and Manipuri{\textrightarrow}English.We propose a method to improve translation performance from low-resource languages (LRLs) to English by injecting Language-specific word-level noise into the parallel corpus of a closely related high-resource language (HRL).In the proposed method, word replacements are performed based on edit distance, using vocabulary and frequency information extracted from an LRL monolingual corpus.Experiments conducted on Assamese and Manipuri show that, in the absence of LRL parallel data, the proposed method outperforms both the w/o noise setting and existing approaches. Furthermore, we confirmed that increasing the size of the monolingual corpus used for noise injection leads to improved translation performance."
}Markdown (Informal)
[AkibaNLP-TUT: Injecting Language-Specific Word-Level Noise for Low-Resource Language Translation](https://preview.aclanthology.org/name-variant-enfa-fane/2025.wmt-1.104/) (Hamada et al., WMT 2025)
ACL