@inproceedings{madhurapantula-pulagara-2026-mano,
title = "Mano{\_}sub@{D}ravidian{L}ang{T}ech 2026: Article-Aware Batching and Discriminative Fine-Tuning of {M}u{RIL} for {T}elugu Prompt-Style Classification",
author = "Madhurapantula, Manohar Sita Rama and
Pulagara, Seshu Babu",
editor = "Chakravarthi, Bharathi Raja and
Priyadharshini, Ruba and
Madasamy, Anand Kumar and
Thavareesan, Sajeetha and
Rajiakodi, Saranya and
Navaneethakrishnan, Subalalitha and
Chinnappa, Dhivya and
Palani, Balasubramanian and
Subramanian, Malliga and
Shanmugavadivel, Kogilavani and
Rajalakshmi, Ratnavel",
booktitle = "Proceedings of the Sixth Workshop on Speech, Vision, and Language Technologies for {D}ravidian Languages",
month = jul,
year = "2026",
address = "Underline (Virtual)",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-acl-workshops/2026.dravidianlangtech-1.45/",
pages = "294--300",
ISBN = "979-8-89176-401-9",
abstract = "This paper presents Team Mano{\_}sub{'}s sub mission to the Telugu Prompt-Style Recovery task at DravidianLangTech 2026, classifying Telugu text into nine stylistic categories: Formal, Informal, Optimistic, Pessimistic, Humorous, Serious, Inspiring, Authoritative, and Persuasive. We identify a critical structural property of the dataset: each of 384 unique source articles appears ap proximately 7.8 times with different style la bels. Standard random batching leads to poor within-batch diversity when same-article samples co-occur, causing majority-class collapse and keeping macro F1 stuck at 0.022 regard less of learning rate. We propose an article aware batch sampler that enforces within-batch article diversity, combined with discriminative learning rates for full MuRIL fine-tuning. Complete five-fold cross-validation yields a mean macro F1 of 0.3834 (std=0.0189) on the development set, with fold best scores ranging from 0.3488 to 0.4040. The fold 1 best model achieves macro F1=0.2765 on the official test set {---}a5.6{\texttimes}improvement over our officially submitted result of F1=0.0491, which would have ranked 2nd among all 13 participating teams. All nine style classes are correctly predicted by epoch 5. Our system is officially ranked 12th in the Prompt Recovery for LLM in Telugu shared task at DravidianLangTech@ACL 2026. Code: https:// github.com/msrmanohar/ACL-PRLLM"
}Markdown (Informal)
[Mano_sub@DravidianLangTech 2026: Article-Aware Batching and Discriminative Fine-Tuning of MuRIL for Telugu Prompt-Style Classification](https://preview.aclanthology.org/ingest-acl-workshops/2026.dravidianlangtech-1.45/) (Madhurapantula & Pulagara, DravidianLangTech 2026)
ACL