% Conference paper (Wang and Wu, ACL 2026) on a two-stage, MQM-guided automatic post-editing framework.
% NOTE(review): the url field points at the Anthology preview/ingest host - confirm the canonical URL once the volume is published.
@inproceedings{wang-wu-2026-diagnose,
  author    = {Wang, Ji Hun and
               Wu, Siyu},
  title     = {Diagnose, Then Repair: A Two-Stage {MQM}-Guided Post-Editing Framework for Domain-Specific Machine Translation},
  editor    = {Li, Yunyao and
               Rehm, Georg and
               Tu, Mei},
  booktitle = {Proceedings of the 64th Annual Meeting of the {Association} for {Computational} {Linguistics} ({ACL} 2026)},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, USA},
  publisher = {Association for Computational Linguistics},
  pages     = {1683--1698},
  isbn      = {979-8-89176-394-4},
  url       = {https://preview.aclanthology.org/ingest-acl/2026.acl-industry.115/},
  abstract  = {LLM-based machine translation evaluation can closely match human judgments, but in practice it remains largely diagnostic, with the signals rarely translating into direct quality improvements under real production constraints. We propose a two-stage, evaluator-guided automatic post-editing framework that turns MQM-style evaluation into targeted repairs: a retrieval-augmented LLM evaluator outputs structured, span-level MQM diagnoses under an explicit edit contract, and a separate LLM post-editor applies minimal edits restricted to those diagnoses. This separation improves controllability and reduces paraphrastic drift compared to one-stage ``judge-and-refine'' baselines. In a systematic study involving seven LLMs spanning three model providers and seven languages, our best configuration consistently improves both reference-based COMET and CometKiwi scores over one-stage post-edit methods, while the evaluator{'}s error spans and severities show strong agreement with human MQM annotations and human editor preferences.},
}
Markdown (Informal)
[Diagnose, Then Repair: A Two-Stage MQM-Guided Post-Editing Framework for Domain-Specific Machine Translation](https://preview.aclanthology.org/ingest-acl/2026.acl-industry.115/) (Wang & Wu, ACL 2026)
ACL