@inproceedings{byrne-etal-2022-topic,
title = "Topic Modeling With Topological Data Analysis",
author = "Byrne, Ciar{\'a}n and
Horak, Danijela and
Moilanen, Karo and
Mabona, Amandla",
editor = "Goldberg, Yoav and
Kozareva, Zornitsa and
Zhang, Yue",
booktitle = "Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing",
month = dec,
year = "2022",
address = "Abu Dhabi, United Arab Emirates",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/jlcl-multiple-ingestion/2022.emnlp-main.792/",
doi = "10.18653/v1/2022.emnlp-main.792",
pages = "11514--11533",
abstract = "Recent unsupervised topic modelling ap-proaches that use clustering techniques onword, token or document embeddings can ex-tract coherent topics. A common limitationof such approaches is that they reveal noth-ing about inter-topic relationships which areessential in many real-world application do-mains. We present an unsupervised topic mod-elling method which harnesses TopologicalData Analysis (TDA) to extract a topologicalskeleton of the manifold upon which contextu-alised word embeddings lie. We demonstratethat our approach, which performs on par witha recent baseline, is able to construct a networkof coherent topics together with meaningfulrelationships between them."
}
Markdown (Informal)
[Topic Modeling With Topological Data Analysis](https://preview.aclanthology.org/jlcl-multiple-ingestion/2022.emnlp-main.792/) (Byrne et al., EMNLP 2022)
ACL
- Ciarán Byrne, Danijela Horak, Karo Moilanen, and Amandla Mabona. 2022. Topic Modeling With Topological Data Analysis. In Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, pages 11514–11533, Abu Dhabi, United Arab Emirates. Association for Computational Linguistics.