@inproceedings{nicosia-etal-2021-translate-fill,
title = "{T}ranslate {\&} {F}ill: {I}mproving Zero-Shot Multilingual Semantic Parsing with Synthetic Data",
author = "Nicosia, Massimo and
Qu, Zhongdi and
Altun, Yasemin",
editor = "Moens, Marie-Francine and
Huang, Xuanjing and
Specia, Lucia and
Yih, Scott Wen-tau",
booktitle = "Findings of the Association for Computational Linguistics: EMNLP 2021",
month = nov,
year = "2021",
address = "Punta Cana, Dominican Republic",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/fix-sig-urls/2021.findings-emnlp.279/",
doi = "10.18653/v1/2021.findings-emnlp.279",
pages = "3272--3284",
abstract = "While multilingual pretrained language models (LMs) fine-tuned on a single language have shown substantial cross-lingual task transfer capabilities, there is still a wide performance gap in semantic parsing tasks when target language supervision is available. In this paper, we propose a novel Translate-and-Fill (TaF) method to produce silver training data for a multilingual semantic parser. This method simplifies the popular Translate-Align-Project (TAP) pipeline and consists of a sequence-to-sequence filler model that constructs a full parse conditioned on an utterance and a view of the same parse. Our filler is trained on English data only but can accurately complete instances in other languages (i.e., translations of the English training utterances), in a zero-shot fashion. Experimental results on three multilingual semantic parsing datasets show that data augmentation with TaF reaches accuracies competitive with similar systems which rely on traditional alignment techniques."
}
Markdown (Informal)
[Translate & Fill: Improving Zero-Shot Multilingual Semantic Parsing with Synthetic Data](https://preview.aclanthology.org/fix-sig-urls/2021.findings-emnlp.279/) (Nicosia et al., Findings 2021)
ACL