% Conference-paper entry; field values are brace-delimited and the month uses the predefined macro.
% NOTE(review): the url field points at the preview/ingest host -- confirm the canonical address once the volume is published.
@inproceedings{subramani-2026-harnessing,
  title     = {Harnessing the Latent Space: From Steering Vectors to Model Calibrators for Control and Trust},
  author    = {Subramani, Nishant},
  editor    = {Elazar, Yanai and
               Ettinger, Allyson and
               Kassner, Nora and
               Ruder, Sebastian},
  booktitle = {Proceedings of The Big Picture v2: Crafting a Research Narrative},
  month     = jul,
  year      = {2026},
  address   = {San Diego, CA, USA},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-acl-workshops/2026.bigpicture-main.10/},
  pages     = {119--130},
  isbn      = {979-8-89176-416-3},
  abstract  = {Language models have changed from unreliable text generators to highly-capable large models with trillions of parameters. Capability increases come hand-in-hand with increases in scale, making understanding the internal representations of models more challenging. Since millions of users increasingly rely on language models to interact with external tools or make decisions in medium or high-stakes scenarios, we need to establish control over model behavior and know when to trust model outputs. In this paper, we discuss our contributions on harnessing the latent spaces by proposing steering vectors for control and developing latent space-based model calibrators for trust. Together, our contributions help demystify the latent spaces of language models and offer new insights into how to harness model internals to build more trustworthy language technology.},
}
Markdown (Informal)
[Harnessing the Latent Space: From Steering Vectors to Model Calibrators for Control and Trust](https://preview.aclanthology.org/ingest-acl-workshops/2026.bigpicture-main.10/) (Subramani, BigPicture 2026)
ACL