@inproceedings{creanga-dinu-2026-llm,
title = "{LLM}-as-a-Judge for Low-Resource Languages: Adapting Ragas and Comparative Ranking for {R}omanian",
author = "Creanga, Claudiu and
Dinu, Liviu P",
editor = "Hettiarachchi, Hansi and
Ranasinghe, Tharindu and
Plum, Alistair and
Rayson, Paul and
Mitkov, Ruslan and
Gaber, Mohamed and
Premasiri, Damith and
Tan, Fiona Anting and
Uyangodage, Lasitha",
booktitle = "Proceedings of the Second Workshop on Language Models for Low-Resource Languages ({L}o{R}es{LM} 2026)",
month = mar,
year = "2026",
address = "Rabat, Morocco",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/manual-author-scripts/2026.loreslm-1.15/",
pages = "157--167",
ISBN = "979-8-89176-377-7",
abstract = "Evaluating Retrieval-Augmented Generation (RAG) systems remains a challenge for Low-Resource Languages (LRLs), where standard reference-based metrics fall short. This paper investigates the viability of the ``LLM-as-a-Judge'' paradigm for Romanian by adapting the Ragas framework using next-generation models (Gemini 2.5 and Gemini 3). We introduce AdminRo-Eval, a curated dataset of Romanian administrative documents annotated by native speakers, to serve as a ground truth for benchmarking automated evaluators. We compare three evaluation methodologies{---}direct scoring, comparative ranking, and granular decomposition{---}across metrics for Faithfulness, Answer Relevance, and Context Relevance. Our findings reveal that evaluation strategies must be metric-specific: granular decomposition achieves the highest human alignment for Faithfulness (96{\%} with Gemini 2.5 Pro), while comparative ranking outperforms in Answer Relevance (90{\%}). Furthermore, we demonstrate that while lightweight models struggle with complex reasoning in LRLs, the Gemini 2.5 Pro architecture establishes a robust, transferable baseline for automated Romanian RAG evaluation."
}Markdown (Informal)
[LLM-as-a-Judge for Low-Resource Languages: Adapting Ragas and Comparative Ranking for Romanian](https://preview.aclanthology.org/manual-author-scripts/2026.loreslm-1.15/) (Creanga & Dinu, LoResLM 2026)
ACL