@inproceedings{dewan-rifat-2025-pybhasha,
title = "{P}y{B}hasha at {BLP}-2025 Task 2: Effectiveness of Semantic-Aware Translation and Ensembling in {B}angla Code Generation",
author = "Dewan, Foyez Ahmed and
Rifat, Nahid Montasir",
editor = "Alam, Firoj and
Kar, Sudipta and
Chowdhury, Shammur Absar and
Hassan, Naeemul and
Prince, Enamul Hoque and
Tasnim, Mohiuddin and
Rony, Md Rashad Al Hasan and
Rahman, Md Tahmid Rahman",
booktitle = "Proceedings of the Second Workshop on Bangla Language Processing (BLP-2025)",
month = dec,
year = "2025",
address = "Mumbai, India",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-ijcnlp-aacl/2025.banglalp-1.64/",
pages = "624--628",
ISBN = "979-8-89176-314-2",
abstract = "In this paper, we present our submission to Task 2 of the BLP-2025 shared task on code generation from Bangla instructions. Our approach focused on enhancing instruction quality through translation and improving model performance with a two-stage ensemble strategy. We evaluated two proprietary and several open-source models under three instruction settings: original Bangla instructions, Bangla instructions translated into English using Facebook NLLB, and instructions rewritten in English with GPT-4.1. Experimental results showed that GPT-4.1-rewritten instructions consistently achieved the highest accuracy across models. For final predictions, we used a two-stage ensemble, achieving a $\textit{pass@1}$ score of $\textbf{80.0\%}$ on the hidden test set and securing 12th place on the official leaderboard. Additionally, we conducted a qualitative analysis of selected translations to illustrate how variations in instruction phrasing influenced model outputs."
}Markdown (Informal)
[PyBhasha at BLP-2025 Task 2: Effectiveness of Semantic-Aware Translation and Ensembling in Bangla Code Generation](https://preview.aclanthology.org/ingest-ijcnlp-aacl/2025.banglalp-1.64/) (Dewan & Rifat, BanglaLP 2025)
ACL