% Nagata & Tanaka-Ishii, ACL 2025 (Volume 1: Long Papers), Anthology ID 2025.acl-long.744.
% The url field uses the canonical ACL Anthology address, not the temporary
% ingestion-preview host, so the link stays valid after the volume is published.
@inproceedings{nagata-tanaka-ishii-2025-new,
  title     = {A New Formulation of {Zipf's} Meaning-Frequency Law through Contextual Diversity},
  author    = {Nagata, Ryo and
               Tanaka-Ishii, Kumiko},
  editor    = {Che, Wanxiang and
               Nabende, Joyce and
               Shutova, Ekaterina and
               Pilehvar, Mohammad Taher},
  booktitle = {Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)},
  month     = jul,
  year      = {2025},
  address   = {Vienna, Austria},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.acl-long.744/},
  pages     = {15323--15335},
  isbn      = {979-8-89176-251-0},
  abstract  = {This paper proposes formulating Zipf's meaning-frequency law, the power law between word frequency and the number of meanings, as a relationship between word frequency and contextual diversity. The proposed formulation quantifies meaning counts as contextual diversity, which is based on the directions of contextualized word vectors obtained from a Language Model (LM). This formulation gives a new interpretation to the law and also enables us to examine it for a wider variety of words and corpora than previous studies have explored. In addition, this paper shows that the law becomes unobservable when the size of the LM used is small and that autoregressive LMs require much more parameters than masked LMs to be able to observe the law.},
}
Markdown (Informal)
[A New Formulation of Zipf’s Meaning-Frequency Law through Contextual Diversity](https://aclanthology.org/2025.acl-long.744/) (Nagata & Tanaka-Ishii, ACL 2025)
ACL