@comment{Workshop paper record. The url field holds the canonical ACL Anthology permalink rather than a preview-branch address, and the tool name in the title is brace-protected as a whole word so sentence-casing styles keep its capitalisation.}
@inproceedings{tercon-dobrovoljc-2025-comparatree,
  author    = {Ter{\v{c}}on, Luka and
               Dobrovoljc, Kaja},
  title     = {{ComparaTree}: A Multi-Level Comparative Treebank Analysis Tool},
  editor    = {Jablotschkin, Sarah and
               K{\"u}bler, Sandra and
               Zinsmeister, Heike},
  booktitle = {Proceedings of the 23rd International Workshop on Treebanks and Linguistic Theories ({TLT}, {SyntaxFest} 2025)},
  month     = aug,
  year      = {2025},
  address   = {Ljubljana, Slovenia},
  publisher = {Association for Computational Linguistics},
  pages     = {129--139},
  isbn      = {979-8-89176-291-6},
  url       = {https://aclanthology.org/2025.tlt-1.15/},
  abstract  = {ComparaTree is a tool for comparative treebank analysis that combines various methods of quantitative linguistic analysis to provide a general overview of the differences and similarities between two treebanks. The comparison tool covers a range of subfields of linguistic analysis, providing a summary of the differences and similarities in terms of the lexical diversity, n-gram diversity, part-of-speech and dependency relation proportions, syntactic complexity, and syntactic diversity. We explain the various quantitative analyses performed on every level along with the generation of graphical visualizations, which add value by enabling user-friendly comparisons at a glance. We exemplify the comparison process by presenting the results produced by the tool when comparing two treebanks from the Universal Dependencies collection.},
}
Markdown (Informal)
[ComparaTree: A Multi-Level Comparative Treebank Analysis Tool](https://aclanthology.org/2025.tlt-1.15/) (Terčon & Dobrovoljc, TLT-SyntaxFest 2025)
ACL