@inproceedings{cao-etal-2025-rationalize,
title = "Rationalize and Align: Enhancing Writing Assistance with Rationale via Self-Training for Improved Alignment",
author = "Cao, Hannan and
Ye, Hai and
Ng, Hwee Tou",
editor = "Che, Wanxiang and
Nabende, Joyce and
Shutova, Ekaterina and
Pilehvar, Mohammad Taher",
booktitle = "Findings of the Association for Computational Linguistics: ACL 2025",
month = jul,
year = "2025",
address = "Vienna, Austria",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/display_plenaries/2025.findings-acl.1383/",
pages = "26967--26982",
ISBN = "979-8-89176-256-5",
abstract = "A Writing Assistant (WA) is a system that offers writing suggestions based on user instructions. Existing WAs are typically built by training large language models (LLMs) on domain-specific instruction data through supervised fine-tuning (SFT) only. However, SFT optimizes models to match a single reference, failing to capture the inherent flexibility of text editing, where multiple valid revisions exist. Therefore, solely relying on SFT limits WA performance. To address this limitation, we propose the Rationalize and Align framework, which enhances the WA performance with rationale (i.e., linguistic explanations) and alignment. Our framework automatically generates the rationale and preference data for writing tasks via distillation and self-training, eliminating the need for human annotation. These data are then leveraged to refine WA using a novel preference optimization method. Empirical results show that our framework significantly improves WA performance. Our WA outperforms both open-source state-of-the-art WAs and the closed-source GPT-4o by 3.9 and 7.1 points on average, respectively, across eight well-established writing-related test sets."
}
Markdown (Informal)
[Rationalize and Align: Enhancing Writing Assistance with Rationale via Self-Training for Improved Alignment](https://preview.aclanthology.org/display_plenaries/2025.findings-acl.1383/) (Cao et al., Findings 2025)
ACL