@comment{
  Conference-paper entry for the CAPO paper (Pokharel, Tao, Agrawal; 2025).
  NOTE(review): the url field points at a preview.aclanthology.org ingest path,
  presumably a staging link; confirm the canonical URL before relying on it.
  NOTE(review): address holds "Mumbai, India", which looks like the conference
  venue rather than a publisher city; left as exported, confirm if it matters
  for the target style.
}
@inproceedings{pokharel-etal-2025-capo,
  title     = {{CAPO}: Confidence Aware Preference Optimization Learning for Multilingual Preferences},
  author    = {Pokharel, Rhitabrat and
               Tao, Yufei and
               Agrawal, Ameeta},
  editor    = {Inui, Kentaro and
               Sakti, Sakriani and
               Wang, Haofen and
               Wong, Derek F. and
               Bhattacharyya, Pushpak and
               Banerjee, Biplab and
               Ekbal, Asif and
               Chakraborty, Tanmoy and
               Singh, Dhirendra Pratap},
  booktitle = {Proceedings of the 14th International Joint Conference on Natural Language Processing and the 4th Conference of the Asia-Pacific Chapter of the Association for Computational Linguistics},
  month     = dec,
  year      = {2025},
  address   = {Mumbai, India},
  publisher = {The Asian Federation of Natural Language Processing and The Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-ijcnlp-aacl/2025.findings-ijcnlp.69/},
  pages     = {1144--1156},
  isbn      = {979-8-89176-303-6},
  abstract  = {Preference optimization is a critical post-training technique used to align large language models (LLMs) with human preferences, typically by fine-tuning on ranked response pairs. While methods like Direct Preference Optimization (DPO) have proven effective in English, they often fail to generalize robustly to multilingual settings. We propose a simple yet effective alternative, Confidence-Aware Preference Optimization (CAPO), which replaces DPO{'}s fixed treatment of preference pairs with a dynamic loss scaling mechanism based on a relative reward. By modulating the learning signal according to the confidence in each preference pair, CAPO enhances robustness to noisy or low-margin comparisons, typically encountered in multilingual text. Empirically, CAPO outperforms existing preference optimization baselines by at least 16{\%} in reward accuracy, and improves alignment by widening the gap between preferred and dispreferred responses across languages.},
}

Markdown (Informal)
[CAPO: Confidence Aware Preference Optimization Learning for Multilingual Preferences](https://preview.aclanthology.org/ingest-ijcnlp-aacl/2025.findings-ijcnlp.69/) (Pokharel et al., Findings 2025)
ACL
- Rhitabrat Pokharel, Yufei Tao, and Ameeta Agrawal. 2025. CAPO: Confidence Aware Preference Optimization Learning for Multilingual Preferences. In Proceedings of the 14th International Joint Conference on Natural Language Processing and the 4th Conference of the Asia-Pacific Chapter of the Association for Computational Linguistics, pages 1144–1156, Mumbai, India. The Asian Federation of Natural Language Processing and The Association for Computational Linguistics.