% Seo et al., ACL 2025 (Volume 2: Short Papers), pp. 575--589.
% The url field uses the canonical Anthology address instead of a preview deployment.
@inproceedings{seo-etal-2025-feat,
  title     = {{FEAT}: A Preference Feedback Dataset through a Cost-Effective Auto-Generation and Labeling Framework for {English} {AI} Tutoring},
  author    = {Seo, Hyein and
               Hwang, Taewook and
               Lee, Yohan and
               Jung, Sangkeun},
  editor    = {Che, Wanxiang and
               Nabende, Joyce and
               Shutova, Ekaterina and
               Pilehvar, Mohammad Taher},
  booktitle = {Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers)},
  month     = jul,
  year      = {2025},
  address   = {Vienna, Austria},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.acl-short.45/},
  pages     = {575--589},
  isbn      = {979-8-89176-252-7},
  abstract  = {In English education tutoring, teacher feedback is essential for guiding students. Recently, AI-based tutoring systems have emerged to assist teachers; however, these systems require high-quality and large-scale teacher feedback data, which is both time-consuming and costly to generate manually. In this study, we propose FEAT, a cost-effective framework for generating teacher feedback, and have constructed three complementary datasets: (1) DIRECT-Manual (DM), where both humans and large language models (LLMs) collaboratively generate high-quality teacher feedback, albeit at a higher cost; (2) DIRECT-Generated (DG), an LLM-only generated, cost-effective dataset with lower quality; and (3) DIRECT-Augmented (DA), primarily based on DG with a small portion of DM added to enhance quality while maintaining cost-efficiency. Experimental results showed that incorporating a small portion of DM (5{--}10{\%}) into DG leads to superior performance compared to using 100{\%} DM alone.},
}
Markdown (Informal)
[FEAT: A Preference Feedback Dataset through a Cost-Effective Auto-Generation and Labeling Framework for English AI Tutoring](https://preview.aclanthology.org/landing_page/2025.acl-short.45/) (Seo et al., ACL 2025)
ACL