% IWCLUL 2024 workshop paper, ACL Anthology ID 2024.iwclul-1.12.
% The citation key is kept exactly as exported so existing \cite commands still resolve.
% Second author is entered as family name Bajzat (acute on the second a), given names Timea Borbala.
@inproceedings{indig-borbala-bajzat-2024-compressing,
  title     = {Compressing Noun Phrases to Discover Mental Constructions in Corpora -- A Case Study for Auxiliaries in {Hungarian}},
  author    = {Indig, Bal{\'a}zs and
               Bajz{\'a}t, T{\'i}mea Borb{\'a}la},
  editor    = {H{\"a}m{\"a}l{\"a}inen, Mika and
               Pirinen, Flammie and
               Macias, Melany and
               Crespo Avila, Mario},
  booktitle = {Proceedings of the 9th International Workshop on Computational Linguistics for Uralic Languages},
  month     = nov,
  year      = {2024},
  address   = {Helsinki, Finland},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2024.iwclul-1.12/},
  pages     = {96--103},
  abstract  = {The quantitative turn in functional linguistics has emphasised the importance of data-oriented methods in describing linguistic patterns. However, there are significant differences between constructions and the examples they cover, which need to be properly formalised. For example, noun chains introduce significant variation in the examples, making it difficult to identify underlying patterns. The compression of noun chains into their minimal form (e.g. as they appear in abstract constructions) is a promising method for revealing linguistic patterns in corpora through their examples. This method, combined with identifying the appropriate level of abstraction for the additional elements present, allows for the systematic extraction of good construction candidates. A pilot has been developed for Hungarian infinitive structures, but is adaptable for various linguistic structures and other agglutinative languages.},
}
Markdown (Informal)
[Compressing Noun Phrases to Discover Mental Constructions in Corpora – A Case Study for Auxiliaries in Hungarian](https://aclanthology.org/2024.iwclul-1.12/) (Indig & Bajzát, IWCLUL 2024)
ACL