% Conference paper record (ACL Anthology export).
% NOTE(review): the url field points at a preview.aclanthology.org ingest
%   branch; confirm the canonical Anthology URL once the volume is published.
% NOTE(review): the second author's surname is hyphenated in the author field
%   but unhyphenated in the editor field; confirm the intended spelling.
@inproceedings{babakov-bugarin-diz-2026-decomposition,
  title     = {Decomposition Does Not Help: Evidence from Semantic Clustering in {LLM}-based Causal Graph Discovery},
  author    = {Babakov, Nikolay and
               Bugar{\'i}n-Diz, Alberto},
  editor    = {Mahamood, Saad and
               Howcroft, David M. and
               van Deemter, Kees and
               Balloccu, Simone and
               Sivaprasad, Adarsa and
               Sundararajan, Barkavi and
               Bugar{\'i}n Diz, Alberto and
               Alonso-Moral, Jose Mar{\'i}a},
  booktitle = {Proceedings of the 1st Symposium on Natural Language Generation Evaluations},
  month     = jun,
  year      = {2026},
  address   = {Aberdeen, United Kingdom},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-retroeval/2026.retroeval-main.1/},
  pages     = {1--7},
  isbn      = {979-8-89176-436-1},
  abstract  = {Recent advances in large language models (LLMs) have enabled their application to non-traditional tasks such as causal graph construction, a key component of reasoning frameworks, including Bayesian Networks. The most effective existing approaches rely on direct prompting, where an LLM generates a complete graph from a full set of variables in a single step. However, the performance of such methods degrades as the number of graph nodes increases. To address this limitation, we explore a divide-and-conquer alternative based on semantic clustering. Node representations are first embedded and clustered, after which subgraphs are constructed independently for each cluster using LLM prompting. The resulting subgraphs are then merged pairwise into a global graph. Contrary to our expectations, this approach leads to a substantial degradation in performance compared to direct prompting baselines, as measured by Structural Hamming Distance (SHD). We attribute this to the misalignment between semantic similarity and causal structure, as well as error propagation during subgraph merging. We report these negative results to highlight the limitations of decomposition strategies in LLM-based causal graphs construction.},
}
Markdown (Informal)
[Decomposition Does Not Help: Evidence from Semantic Clustering in LLM-based Causal Graph Discovery](https://preview.aclanthology.org/ingest-retroeval/2026.retroeval-main.1/) (Babakov & Bugarín-Diz, RetroEval 2026)
ACL