@inproceedings{wang-etal-2020-negative,
title = "On Negative Interference in Multilingual Models: Findings and A Meta-Learning Treatment",
author = "Wang, Zirui and
Lipton, Zachary C. and
Tsvetkov, Yulia",
editor = "Webber, Bonnie and
Cohn, Trevor and
He, Yulan and
Liu, Yang",
booktitle = "Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing (EMNLP)",
month = nov,
year = "2020",
address = "Online",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/jlcl-multiple-ingestion/2020.emnlp-main.359/",
doi = "10.18653/v1/2020.emnlp-main.359",
pages = "4438--4450",
abstract = "Modern multilingual models are trained on concatenated text from multiple languages in hopes of conferring benefits to each (positive transfer), with the most pronounced benefits accruing to low-resource languages. However, recent work has shown that this approach can degrade performance on high-resource languages, a phenomenon known as negative interference. In this paper, we present the first systematic study of negative interference. We show that, contrary to previous belief, negative interference also impacts low-resource languages. While parameters are maximally shared to learn language-universal structures, we demonstrate that language-specific parameters do exist in multilingual models and they are a potential cause of negative interference. Motivated by these observations, we also present a meta-learning algorithm that obtains better cross-lingual transferability and alleviates negative interference, by adding language-specific layers as meta-parameters and training them in a manner that explicitly improves shared layers' generalization on all languages. Overall, our results show that negative interference is more common than previously known, suggesting new directions for improving multilingual representations."
}
Markdown (Informal)
[On Negative Interference in Multilingual Models: Findings and A Meta-Learning Treatment](https://preview.aclanthology.org/jlcl-multiple-ingestion/2020.emnlp-main.359/) (Wang et al., EMNLP 2020)
ACL