@comment{LTG system description paper for the VarDial 2025 shared task (Norwegian slot and intent detection).}
@inproceedings{midtgaard-etal-2025-ltg,
  title     = {{LTG} at {VarDial} 2025 {NorSID}: More and Better Training Data for Slot and Intent Detection},
  author    = {Midtgaard, Marthe and
               M{\ae}hlum, Petter and
               Scherrer, Yves},
  editor    = {Scherrer, Yves and
               Jauhiainen, Tommi and
               Ljube{\v{s}}i{\'c}, Nikola and
               Nakov, Preslav and
               Tiedemann, J{\"o}rg and
               Zampieri, Marcos},
  booktitle = {Proceedings of the 12th Workshop on {NLP} for Similar Languages, Varieties and Dialects},
  month     = jan,
  year      = {2025},
  address   = {Abu Dhabi, UAE},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.vardial-1.15/},
  pages     = {200--208},
  abstract  = {This paper describes the LTG submission to the VarDial 2025 shared task, where we participate in the Norwegian slot and intent detection subtasks. The shared task focuses on Norwegian dialects, which present challenges due to their low-resource nature and variation. We test a variety of neural models and training data configurations, with the focus on improving and extending the available Norwegian training data. This includes automatically re-aligning slot spans in Norwegian Bokm{\r{a}}l, as well as re-translating the original English training data into both Bokm{\r{a}}l and Nynorsk to address dialectal diversity. We also re-annotate an external Norwegian dataset to augment the training data. Our best models achieve first place in both subtasks, achieving a span F1 score of 0.893 for slot filling and an accuracy of 0.980 for intent detection. Our results indicate that while translation quality is less critical, improving the slot labels has a notable impact on slot performance. Moreover, adding more standard Norwegian data improves performance, but incorporating even small amounts of dialectal data leads to greater gains.},
}
Markdown (Informal)
[LTG at VarDial 2025 NorSID: More and Better Training Data for Slot and Intent Detection](https://aclanthology.org/2025.vardial-1.15/) (Midtgaard et al., VarDial 2025)
ACL