@inproceedings{ranaldi-etal-2025-natural,
title = "When natural language is not enough: The limits of in-context learning demonstrations in multilingual reasoning",
author = "Ranaldi, Leonardo and
Haddow, Barry and
Birch, Alexandra",
editor = "Chiruzzo, Luis and
Ritter, Alan and
Wang, Lu",
booktitle = "Findings of the Association for Computational Linguistics: NAACL 2025",
month = apr,
year = "2025",
address = "Albuquerque, New Mexico",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/fix-sig-urls/2025.findings-naacl.412/",
pages = "7369--7396",
ISBN = "979-8-89176-195-7",
abstract = "Previous studies have demonstrated the effectiveness of reasoning methods in eliciting multi-step reasoned answers from Large Language Models (LLMs) by leveraging in-context demonstrations. These methods, exemplified by Chain-of-Thought (CoT) and Program-Aided Language Models (PAL), have been shown to perform well in monolingual contexts, primarily in English. There has, however, been limited exploration of their abilities in other languages.To gain a deeper understanding of the role of reasoning methods for in-context demonstrations, we investigate how well CoT and PAL perform across languages for arithmetic and symbolic reasoning tasks. Our findings indicate that the effectiveness of reasoning methods varies significantly across different languages and models. Specifically, CoT, which relies on natural language demonstrations, tends to be more accurate in high-resource than in low-resource languages. Conversely, the structured nature of PAL demonstrations facilitates multilingual comprehension, enabling LLMs to generate programmatic answers in both high- and low-resource languages and leading to significant performance improvements over CoT concerning the accuracy of the generated responses."
}
Markdown (Informal)
[When natural language is not enough: The limits of in-context learning demonstrations in multilingual reasoning](https://preview.aclanthology.org/fix-sig-urls/2025.findings-naacl.412/) (Ranaldi et al., Findings 2025)
ACL