% Anand and Dunn, IWCS 2025 (ACL Anthology ID 2025.iwcs-1.28).
% The proper noun in the title is brace-protected as a whole word so that
% sentence-casing bibliography styles keep its capital letter. The url field
% holds the canonical Anthology address built from the Anthology ID, not the
% temporary ingestion-preview link.
@inproceedings{anand-dunn-2025-mapping,
    author    = {Anand, Gunjan and
                 Dunn, Jonathan},
    title     = {Mapping Semantic Domains Across {India's} Social Media: Networks, Geography, and Social Factors},
    editor    = {Evang, Kilian and
                 Kallmeyer, Laura and
                 Pogodalla, Sylvain},
    booktitle = {Proceedings of the 16th International Conference on Computational Semantics},
    month     = sep,
    year      = {2025},
    address   = {D{\"u}sseldorf, Germany},
    publisher = {Association for Computational Linguistics},
    url       = {https://aclanthology.org/2025.iwcs-1.28/},
    pages     = {317--330},
    isbn      = {979-8-89176-316-6},
    abstract  = {This study examines socially-conditioned variation within semantic domains like kinship and weather using thirteen Indian cities as a case-study. Using bilingual social media data, we infer six semantic domains from corpora representing individual cities with a lexicon including terms from English, Hindi and Transliterated Hindi. The process of inferring semantic domains uses character-based embeddings to retrieve nearest neighbors and Jaccard similarity to operationalize the edge weights between lexical items within each domain. These representations reveal distinct regional variation across all six domains. We then examine the relationship between variation in semantic domains and external social factors such as literacy rates and local demographics. The results show that semantic domains exhibit systematic influences from sociolinguistic factors, a finding that has significant implications for the idea that semantic domains can be studied as abstractions distinct from specific speech communities.},
}
Markdown (Informal)
[Mapping Semantic Domains Across India’s Social Media: Networks, Geography, and Social Factors](https://aclanthology.org/2025.iwcs-1.28/) (Anand & Dunn, IWCS 2025)
ACL