@inproceedings{popovic-farber-2024-embedded,
title = "Embedded Named Entity Recognition using Probing Classifiers",
author = {Popovic, Nicholas and
F{\"a}rber, Michael},
editor = "Al-Onaizan, Yaser and
Bansal, Mohit and
Chen, Yun-Nung",
booktitle = "Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing",
month = nov,
year = "2024",
address = "Miami, Florida, USA",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/fix-sig-urls/2024.emnlp-main.988/",
doi = "10.18653/v1/2024.emnlp-main.988",
pages = "17830--17850",
abstract = "Streaming text generation, has become a common way of increasing the responsiveness of language model powered applications such as chat assistants. At the same time, extracting semantic information from generated text is a useful tool for applications such as automated fact checking or retrieval augmented generation. Currently, this requires either separate models during inference, which increases computational cost, or destructive fine-tuning of the language model. Instead, we propose an approach called EMBER which enables streaming named entity recognition in decoder-only language models without fine-tuning them and while incurring minimal additional computational cost at inference time. Specifically, our experiments show that EMBER maintains high token generation rates, with only a negligible decrease in speed of around 1{\%} compared to a 43.64{\%} slowdown measured for a baseline. We make our code and data available online, including a toolkit for training, testing, and deploying efficient token classification models optimized for streaming text generation."
}
Markdown (Informal)
[Embedded Named Entity Recognition using Probing Classifiers](https://preview.aclanthology.org/fix-sig-urls/2024.emnlp-main.988/) (Popovic & Färber, EMNLP 2024)
ACL