% Conference paper from the NLP4DH 2025 proceedings (ACL Anthology ID 2025.nlp4dh-1.5).
% NOTE(review): `address` appears to hold the conference location rather than the
% publisher's city; kept as exported -- confirm against the target style.
@inproceedings{rueter-partanen-2025-restructuring,
  title     = {Restructuring and visualising dialect dictionary data: Report on {Erzya} and {Moksha} materials},
  author    = {Rueter, Jack and
               Partanen, Niko},
  editor    = {H{\"a}m{\"a}l{\"a}inen, Mika and
               {\"O}hman, Emily and
               Bizzoni, Yuri and
               Miyagawa, So and
               Alnajjar, Khalid},
  booktitle = {Proceedings of the 5th International Conference on Natural Language Processing for Digital Humanities},
  month     = may,
  year      = {2025},
  address   = {Albuquerque, USA},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.nlp4dh-1.5/},
  pages     = {41--47},
  isbn      = {979-8-89176-234-3},
  abstract  = {There are a number of Uralic dialect dictionaries based on fieldwork documentation of individual minority languages from the Pre-Soviet Era. The first of these published by the Finno-Ugrian Society features the Mordvin languages, Erzya and Moksha. In this article, we describe the possibility of reusing XML dialect dictionary collection point and phonetic variant data for visualizing informative linguistic isoglosses with R programming language{'}s Shiny web application framework. We provide a description of the `H. Paasonen Mordvin Dictionary', which will possibly provide the reader with a better perspective of what data and challenges might present themselves in minority language dialect dictionaries. We provide a description of how we processed our data, and then we provide conclusions followed by a more extensive section on limitations. The conclusions state that only some of the data should be rendered with R Shiny web application, whereas some data might be better rendered by other applications. Our limitations section description calls for the extension the dialect dictionary database for a more concise description of the language forms.},
}
Markdown (Informal)
[Restructuring and visualising dialect dictionary data: Report on Erzya and Moksha materials](https://aclanthology.org/2025.nlp4dh-1.5/) (Rueter & Partanen, NLP4DH 2025)
ACL