% Conference paper (EACL 2026, Volume 3: System Demonstrations) describing the DELTA toolkit.
% NOTE(review): the url field points at a preview/ingest host of the ACL Anthology;
% confirm whether a canonical (non-preview) URL or a DOI exists before relying on it.
@inproceedings{esteve-dobrovoljc-2026-delta,
    title     = "{DELTA}: A Toolkit for Measuring Linguistic Diversity in Dependency-Parsed Corpora",
    author    = "Est{\`e}ve, Louis and
                 Dobrovoljc, Kaja",
    editor    = "Croce, Danilo and
                 Leidner, Jochen and
                 Moosavi, Nafise Sadat",
    booktitle = "Proceedings of the 19th Conference of the {E}uropean Chapter of the {A}ssociation for {C}omputational {L}inguistics (Volume 3: System Demonstrations)",
    month     = mar,
    year      = "2026",
    address   = "Rabat, Morocco",
    publisher = "Association for Computational Linguistics",
    url       = "https://preview.aclanthology.org/ingest-eacl/2026.eacl-demo.6/",
    pages     = "75--85",
    isbn      = "979-8-89176-382-1",
    abstract  = "Despite growing interest in measuring linguistic diversity on the one hand and the increasing availability of cross-linguistically comparable parsed corpora on the other, tools for systematically measuring the diversity of specific linguistic phenomena on such data remain limited. To address this gap, we present DELTA, an open-source framework that integrates dependency tree querying with diversity computation, enabling systematic measurement across multiple linguistic levels (e.g., lexis, morphology, syntax) and multiple diversity dimensions (variety, balance, disparity). The pipeline processes CoNLL-U formatted corpora through configurable workflows, treating the format as a general-purpose tabular structure independent of specific annotation conventions. We validate DELTA on Parallel Universal Dependencies multilingual dataset, demonstrating its capacity for corpus profiling and cross-corpus diversity comparison."
}
Markdown (Informal)
[DELTA: A Toolkit for Measuring Linguistic Diversity in Dependency-Parsed Corpora](https://preview.aclanthology.org/ingest-eacl/2026.eacl-demo.6/) (Estève & Dobrovoljc, EACL 2026)
ACL