% Paper in the proceedings of the 7th Workshop on Computational Approaches to
% Linguistic Code-Switching (CALCS 2025).
% NOTE(review): `address` presumably records the conference venue rather than
% the publisher's city -- confirm against the house convention.
@inproceedings{kellert-tyagi-2025-languages,
    title     = {Where and How Do Languages Mix? A Study of {Spanish}-{Guaran{\'i}} Code-Switching in {Paraguay}},
    author    = {Kellert, Olga and
                 Tyagi, Nemika},
    editor    = {Winata, Genta Indra and
                 Kar, Sudipta and
                 Zhukova, Marina and
                 Solorio, Thamar and
                 Ai, Xi and
                 Hamed, Injy and
                 Ihsani, Mahardika Krisna and
                 Wijaya, Derry Tanti and
                 Kuwanto, Garry},
    booktitle = {Proceedings of the 7th Workshop on Computational Approaches to Linguistic Code-Switching},
    month     = may,
    year      = {2025},
    address   = {Albuquerque, New Mexico, USA},
    publisher = {Association for Computational Linguistics},
    url       = {https://aclanthology.org/2025.calcs-1.4/},
    pages     = {26--31},
    isbn      = {979-8-89176-053-0},
    abstract  = {Code-switching, the alternating use of multiple languages within a single utterance, is a widespread linguistic phenomenon that poses unique challenges for both sociolinguistic analysis and Natural Language Processing (NLP). While prior research has explored code-switching from either a syntactic or geographic perspective, few studies have integrated both aspects, particularly for underexplored language pairs like Spanish-Guaran{\'i}. In this paper, we analyze Spanish-Guaran{\'i} code-switching using a dataset of geotagged tweets from Asunci{\'o}n, Paraguay, collected from 2017 to 2021. We employ a differential distribution method to map the geographic distribution of code-switching across urban zones and analyze its syntactic positioning within sentences. Our findings reveal distinct spatial patterns, with Guaran{\'i}-dominant tweets concentrated in the western and southwestern areas, while Spanish-only tweets are more prevalent in central and eastern regions. Syntactic analysis shows that code-switching occurs most frequently in the middle of sentences, often involving verbs, pronouns, and adjectives. These results provide new insights into the interaction between linguistic, social, and geographic factors in bilingual communication. Our study contributes to both sociolinguistic research and NLP applications, offering a framework for analyzing mixed-language data in digital communication.},
}
Markdown (Informal)
[Where and How Do Languages Mix? A Study of Spanish-Guaraní Code-Switching in Paraguay](https://aclanthology.org/2025.calcs-1.4/) (Kellert & Tyagi, CALCS 2025)
ACL