@inproceedings{tran-etal-2025-vaediff,
title = "{V}ae{D}iff-{D}oc{RE}: End-to-end Data Augmentation Framework for Document-level Relation Extraction",
author = "Tran, Khai Phan and
Hua, Wen and
Li, Xue",
editor = "Rambow, Owen and
Wanner, Leo and
Apidianaki, Marianna and
Al-Khalifa, Hend and
Eugenio, Barbara Di and
Schockaert, Steven",
booktitle = "Proceedings of the 31st International Conference on Computational Linguistics",
month = jan,
year = "2025",
address = "Abu Dhabi, UAE",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/jlcl-multiple-ingestion/2025.coling-main.488/",
pages = "7307--7320",
abstract = "Document-level Relation Extraction (DocRE) aims to identify relationships between entity pairs within a document. However, most existing methods assume a uniform label distribution, resulting in suboptimal performance on real-world, imbalanced datasets. To tackle this challenge, we propose a novel data augmentation approach using generative models to enhance data from the embedding space. Our method leverages the Variational Autoencoder (VAE) architecture to capture all relation-wise distributions formed by entity pair representations and augment data for underrepresented relations. To better capture the multi-label nature of DocRE, we parameterize the VAE`s latent space with a Diffusion Model. Additionally, we introduce a hierarchical training framework to integrate the proposed VAE-based augmentation module into DocRE systems. Experiments on two benchmark datasets demonstrate that our method outperforms state-of-the-art models, effectively addressing the long-tail distribution problem in DocRE. Our code is released at: https://github.com/khaitran22/VaeDiff-DocRE"
}
Markdown (Informal)
[VaeDiff-DocRE: End-to-end Data Augmentation Framework for Document-level Relation Extraction](https://preview.aclanthology.org/jlcl-multiple-ingestion/2025.coling-main.488/) (Tran et al., COLING 2025)
ACL