@inproceedings{skadina-etal-2025-first,
title = "First Steps in Benchmarking {L}atvian in Large Language Models",
author = "Skadina, Inguna and
Bakanovs, Bruno and
Dar{\c{g}}is, Roberts",
editor = "Holdt, {\v{S}}pela Arhar and
Ilinykh, Nikolai and
Scalvini, Barbara and
Bruton, Micaella and
Debess, Iben Nyholm and
Tudor, Crina Madalina",
booktitle = "Proceedings of the Third Workshop on Resources and Representations for Under-Resourced Languages and Domains (RESOURCEFUL-2025)",
month = mar,
year = "2025",
address = "Tallinn, Estonia",
publisher = "University of Tartu Library, Estonia",
url = "https://preview.aclanthology.org/landing_page/2025.resourceful-1.22/",
pages = "86--95",
ISBN = "978-9908-53-121-2",
abstract = "The performance of multilingual large language models (LLMs) in low-resource languages, such as Latvian, has been under-explored. In this paper, we investigate the capabilities of several open and commercial LLMs in the Latvian language understanding tasks. We evaluate these models across several well-known benchmarks, such as the Choice of Plausible Alternatives (COPA) and Measuring Massive Multitask Language Understanding (MMLU), which were adapted into Latvian using machine translation. Our results highlight significant variability in model performance, emphasizing the challenges of extending LLMs to low-resource languages. We also analyze the effect of post-editing on machine-translated datasets, observing notable improvements in model accuracy, particularly with BERT-based architectures. We also assess open-source LLMs using the Belebele dataset, showcasing competitive performance from open-weight models when compared to proprietary systems. This study reveals key insights into the limitations of current LLMs in low-resource settings and provides datasets for future benchmarking efforts."
}
Markdown (Informal)
[First Steps in Benchmarking Latvian in Large Language Models](https://preview.aclanthology.org/landing_page/2025.resourceful-1.22/) (Skadina et al., RESOURCEFUL 2025)
ACL
- Inguna Skadina, Bruno Bakanovs, and Roberts Darģis. 2025. First Steps in Benchmarking Latvian in Large Language Models. In Proceedings of the Third Workshop on Resources and Representations for Under-Resourced Languages and Domains (RESOURCEFUL-2025), pages 86–95, Tallinn, Estonia. University of Tartu Library, Estonia.