@inproceedings{orten-etal-2025-neuron,
title = "Neuron-Level Language Tag Injection Improves Zero-Shot Translation Performance",
author = "Orten, Jay and
Shurtz, Ammon and
Fulda, Nancy and
Richardson, Stephen D.",
editor = "Zhao, Jin and
Wang, Mingyang and
Liu, Zhu",
booktitle = "Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 4: Student Research Workshop)",
month = jul,
year = "2025",
address = "Vienna, Austria",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/landing_page/2025.acl-srw.13/",
pages = "203--212",
ISBN = "979-8-89176-254-1",
abstract = "Language tagging, a method whereby source and target inputs are prefixed with a unique language token, has become the de facto standard for conditioning Multilingual Neural Machine Translation (MNMT) models on specific language directions. This conditioning can manifest effective zero-shot translation abilities in MT models at scale for many languages. Expanding on previous work, we propose a novel method of language tagging for MNMT, injection, in which the embedded representation of a language token is concatenated to the input of every linear layer. We explore a variety of different tagging methods, with and without injection, showing that injection improves zero-shot translation performance with up to a 2+ BLEU score point gain for certain language directions in our dataset."
}
Markdown (Informal)
[Neuron-Level Language Tag Injection Improves Zero-Shot Translation Performance](https://preview.aclanthology.org/landing_page/2025.acl-srw.13/) (Orten et al., ACL 2025)
ACL