@article{pinto-etal-2026-relex,
title = "{R}el{E}x-{PT}: A {P}ortuguese Sentence-Level Relation Extraction Dataset",
author = "Pinto, Tom{\'a}s and
Silva, Catarina and
Goncalo Oliveira, Hugo",
editor = "Piperidis, Stelios and
Bel, N{\'u}ria and
van den Heuvel, Henk and
Ide, Nancy and
Krek, Simon and
Toral, Antonio",
journal = "International Conference on Language Resources and Evaluation",
volume = "main",
month = may,
year = "2026",
address = "Palma de Mallorca, Spain",
publisher = "ELRA Language Resource Association",
url = "https://preview.aclanthology.org/ingest-lrec/2026.lrec-main.609/",
pages = "7681--7691",
abstract = "We introduce RelEx-PT, a new sentence-level Relation Extraction dataset for Portuguese. Addressing the scarcity of high-quality, controlled resources for the language, RelEx-PT provides a balanced benchmark comprising 18 Wikidata-derived relation types across diverse domains. The dataset is built through a distant supervision pipeline that links Wikidata triples with Portuguese Wikipedia sentences and enhanced by a Natural Language Inference (NLI)-based filtering process, combining scalability with quality assurance. Additionally, we conduct baseline experiments to evaluate the dataset{'}s applicability across diverse extraction settings, including Relation Classification (RC), Relation Triple Extraction, and Open Information Extraction. These experiments leverage both prompting and fine-tuning strategies using Large Language Models. The results show that RelEx-PT effectively supports a range of extraction paradigms, yielding high performance in RC and competitive results in structured triple generation, while also highlighting key challenges in open-ended extraction."
}Markdown (Informal)
[RelEx-PT: A Portuguese Sentence-Level Relation Extraction Dataset](https://preview.aclanthology.org/ingest-lrec/2026.lrec-main.609/) (Pinto et al., LREC 2026)
ACL