@inproceedings{thirukovalluru-dhingra-2025-geneol,
title = "{G}en{EOL}: Harnessing the Generative Power of {LLM}s for Training-Free Sentence Embeddings",
author = "Thirukovalluru, Raghuveer and
Dhingra, Bhuwan",
editor = "Chiruzzo, Luis and
Ritter, Alan and
Wang, Lu",
booktitle = "Findings of the Association for Computational Linguistics: NAACL 2025",
month = apr,
year = "2025",
address = "Albuquerque, New Mexico",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/landing_page/2025.findings-naacl.122/",
pages = "2295--2308",
ISBN = "979-8-89176-195-7",
abstract = "Training-free embedding methods directly leverage pretrained large language models (LLMs) to embed text, bypassing the costly and complex procedure of contrastive learning. Previous training-free embedding methods have mainly focused on optimizing embedding prompts and have overlooked the benefits of utilizing the generative abilities of LLMs. We propose a novel method, GenEOL, which uses LLMs to generate diverse transformations of a sentence that preserve its meaning, and aggregates the resulting embeddings of these transformations to enhance the overall sentence embedding. GenEOL significantly outperforms the existing training-free embedding methods by an average of 2.85 points across several LLMs on the sentence semantic text similarity (STS) benchmark. GenEOL also achieves notable gains in clustering, reranking, and pair-classification tasks from the MTEB benchmark. Additionally, GenEOL stabilizes representation quality across LLM layers and remains robust to perturbations of embedding prompts."
}
Markdown (Informal)
[GenEOL: Harnessing the Generative Power of LLMs for Training-Free Sentence Embeddings](https://preview.aclanthology.org/landing_page/2025.findings-naacl.122/) (Thirukovalluru & Dhingra, Findings 2025)
ACL