@inproceedings{duan-etal-2025-unveiling,
title = "Unveiling Language Competence Neurons: A Psycholinguistic Approach to Model Interpretability",
author = "Duan, Xufeng and
Zhou, Xinyu and
Xiao, Bei and
Cai, Zhenguang",
editor = "Rambow, Owen and
Wanner, Leo and
Apidianaki, Marianna and
Al-Khalifa, Hend and
Eugenio, Barbara Di and
Schockaert, Steven",
booktitle = "Proceedings of the 31st International Conference on Computational Linguistics",
month = jan,
year = "2025",
address = "Abu Dhabi, UAE",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/jlcl-multiple-ingestion/2025.coling-main.677/",
pages = "10148--10157",
abstract = "As large language models (LLMs) advance in their linguistic capacity, understanding how they capture aspects of language competence remains a significant challenge. This study therefore employs psycholinguistic paradigms, which are well-suited for probing deeper cognitive aspects of language processing, to explore neuron-level representations in language model across three tasks: sound-shape association, sound-gender association, and implicit causality. Our findings indicate that while GPT-2-XL struggles with the sound-shape task, it demonstrates human-like abilities in both sound-gender association and implicit causality. Targeted neuron ablation and activation manipulation reveal a crucial relationship: When GPT-2-XL displays a linguistic ability, specific neurons correspond to that competence; conversely, the absence of such an ability indicates a lack of specialized neurons. This study is the first to utilize psycholinguistic experiments to investigate deep language competence at the neuron level, providing a new level of granularity in model interpretability and insights into the internal mechanisms driving language ability in the transformer-based LLM."
}
Markdown (Informal)
[Unveiling Language Competence Neurons: A Psycholinguistic Approach to Model Interpretability](https://preview.aclanthology.org/jlcl-multiple-ingestion/2025.coling-main.677/) (Duan et al., COLING 2025)
ACL