% Conference paper by Martinez-Criado, Soroa and Barnes (2026).
% Typed as inproceedings: the venue is a conference and the entry carries a
% list of proceedings editors, so the venue name belongs in booktitle rather
% than journal.
% The earlier volume value "main" was not a volume number (it mirrors the
% "lrec-main" segment of the url) and is omitted so styles do not print it.
% NOTE(review): booktitle keeps the venue string exactly as it was recorded;
% the formal proceedings title may differ -- confirm against the published
% front matter.
% NOTE(review): the url points at a preview/ingest host -- confirm the final
% permanent address before relying on it.
@inproceedings{martinez-criado-etal-2026-benchmarking,
  author    = {Martinez-Criado, Inigo and
               Soroa, Aitor and
               Barnes, Jeremy},
  title     = {Benchmarking Mathematical Reasoning in a Low-Resource Language: Structured Prompting and Evaluation in {Basque}},
  booktitle = {International Conference on Language Resources and Evaluation},
  editor    = {Piperidis, Stelios and
               Bel, N{\'u}ria and
               van den Heuvel, Henk and
               Ide, Nancy and
               Krek, Simon and
               Toral, Antonio},
  month     = may,
  year      = {2026},
  address   = {Palma de Mallorca, Spain},
  publisher = {ELRA Language Resource Association},
  pages     = {5268--5289},
  url       = {https://preview.aclanthology.org/ingest-lrec/2026.lrec-main.412/},
  abstract  = {Large Language Models (LLMs) have shown impressive performance on tasks requiring complex reasoning, but most evaluations tend to focus on English and other high-resource languages. This work investigates how well LLMs perform mathematical reasoning in low-resource languages, using Basque as a primary case study. To support this analysis, we introduce MASEU, a benchmark designed to evaluate reasoning in Basque across arithmetic, algebraic, and logical tasks. We then use this dataset to address three key questions: 1) how well do LLMs support Basque in reasoning tasks, 2) to what extent can including English in prompts improve results, and 3) what is the effect of continued pretraining in Basque? To explore these aspects, we use prompting strategies adapted for mathematical reasoning, building upon the foundations of CoT prompting and one of its subsequent evolutions, DUP prompting, which together allow for more precise experimentation across zero-shot and few-shot settings, providing insights into how multilingual models handle reasoning tasks in underrepresented languages.},
}

Markdown (Informal)
[Benchmarking Mathematical Reasoning in a Low-Resource Language: Structured Prompting and Evaluation in Basque](https://preview.aclanthology.org/ingest-lrec/2026.lrec-main.412/) (Martinez-Criado et al., LREC 2026)
ACL