@inproceedings{su-etal-2024-api,
title = "{API} Is Enough: Conformal Prediction for Large Language Models Without Logit-Access",
author = "Su, Jiayuan and
Luo, Jing and
Wang, Hongwei and
Cheng, Lu",
editor = "Al-Onaizan, Yaser and
Bansal, Mohit and
Chen, Yun-Nung",
booktitle = "Findings of the Association for Computational Linguistics: EMNLP 2024",
month = nov,
year = "2024",
address = "Miami, Florida, USA",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/Author-page-Marten-During-lu/2024.findings-emnlp.54/",
doi = "10.18653/v1/2024.findings-emnlp.54",
pages = "979--995",
abstract = "This study aims to address the pervasive challenge of quantifying uncertainty in large language models (LLMs) with black-box API access. Conformal Prediction (CP), known for its model-agnostic and distribution-free features, is a desired approach for various LLMs and data distributions. However, existing CP methods for LLMs typically assume access to the logits, which are unavailable for some API-only LLMs. In addition, logits are known to be miscalibrated, potentially leading to degraded CP performance. To tackle these challenges, we introduce a novel CP method that (1) is tailored for API-only LLMs without logit-access; (2) minimizes the size of prediction sets; and (3) ensures a statistical guarantee of the user-defined coverage. The core idea of this approach is to formulate nonconformity measures using both coarse-grained (i.e., sample frequency) and fine-grained uncertainty notions (e.g., semantic similarity). Experimental results on both close-ended and open-ended Question Answering tasks show our approach can mostly outperform the logit-based CP baselines."
}
Markdown (Informal)
[API Is Enough: Conformal Prediction for Large Language Models Without Logit-Access](https://preview.aclanthology.org/Author-page-Marten-During-lu/2024.findings-emnlp.54/) (Su et al., Findings 2024)
ACL