@inproceedings{li-etal-2026-lending,
title = "Lending Eyesight to Language Models: Modeling and Probing Human scanpath through Transformer Decoder",
author = "Li, Junlin and
Reich, David Robert and
Hsu, Yu-Yin",
editor = "Liakata, Maria and
Moreira, Viviane P. and
Zhang, Jiajun and
Jurgens, David",
booktitle = "Findings of the {A}ssociation for {C}omputational {L}inguistics: {ACL} 2026",
month = jul,
year = "2026",
address = "San Diego, California, United States",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-acl/2026.findings-acl.1591/",
pages = "31807--31819",
ISBN = "979-8-89176-395-1",
abstract = "Human scanpaths offer rich and reliable clues about the cognitive mechanisms underlying language comprehension. Decoder-only language models, typically large language models (LLMs), have proven to exhibit striking parallels with human cognitive processes. In this study, we investigate to what extent language models can be endowed with human-like gaze shifts. Besides, by probing scanpath through eye model, analogous to probing language through language models, we ask whether such modeling can yield novel knowledge of the cognitive machinery of sense making.This study presents a novel plug-and-play module, EyeLM, to transform an autoregressive language model into an autoregressive eye model, thus facilitating a probabilistic spatial modeling of human explicit attention. Our EyeLM module, powered by LLMs, achieves competitive performance with novel cognitive probing capabilities. By probing EyeLM, we can reach the predictability and uncertainty of the scanpath. Exhibiting aligned patterns with prior knowledge about human reading comprehension, these probabilistic measures of scanpath act as promising predictors of human comprehension skills."
}Markdown (Informal)
[Lending Eyesight to Language Models: Modeling and Probing Human scanpath through Transformer Decoder](https://preview.aclanthology.org/ingest-acl/2026.findings-acl.1591/) (Li et al., Findings 2026)
ACL