% Mao et al., EMNLP 2024 proceedings paper. The url field uses the permanent
% ACL Anthology address rather than a temporary preview/ingest build link.
@inproceedings{mao-etal-2024-dont,
    title     = {Don't Forget Your Reward Values: Language Model Alignment via Value-based Calibration},
    author    = {Mao, Xin  and
      Li, Feng-Lin  and
      Xu, Huimin  and
      Zhang, Wei  and
      Chen, Wang  and
      Luu, Anh Tuan},
    editor    = {Al-Onaizan, Yaser  and
      Bansal, Mohit  and
      Chen, Yun-Nung},
    booktitle = {Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing},
    month     = nov,
    year      = {2024},
    address   = {Miami, Florida, USA},
    publisher = {Association for Computational Linguistics},
    url       = {https://aclanthology.org/2024.emnlp-main.976/},
    doi       = {10.18653/v1/2024.emnlp-main.976},
    pages     = {17622--17642}
}