@inproceedings{cohen-etal-2025-historical,
title = "Historical Ink: Exploring Large Language Models for Irony Detection in 19th-Century {S}panish",
author = "Cohen, Kevin and
Manrique-G{\'o}mez, Laura and
Manrique, Ruben",
editor = {H{\"a}m{\"a}l{\"a}inen, Mika and
{\"O}hman, Emily and
Bizzoni, Yuri and
Miyagawa, So and
Alnajjar, Khalid},
booktitle = "Proceedings of the 5th International Conference on Natural Language Processing for Digital Humanities",
month = may,
year = "2025",
address = "Albuquerque, USA",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/Ingest-2025-COMPUTEL/2025.nlp4dh-1.48/",
pages = "559--569",
ISBN = "979-8-89176-234-3",
abstract = "This study explores the use of large language models (LLMs) to enhance datasets and improve irony detection in 19th-century Latin American newspapers. Two strategies were employed to evaluate the efficacy of BERT and GPT models in capturing the subtle nuances nature of irony, through both multi-class and binary classification tasks. First, we implemented dataset enhancements focused on enriching emotional and contextual cues; however, these showed limited impact on historical language analysis. The second strategy, a semi-automated annotation process, effectively addressed class imbalance and augmented the dataset with high-quality annotations. Despite the challenges posed by the complexity of irony, this work contributes to the advancement of sentiment analysis through two key contributions: introducing a new historical Spanish dataset tagged for sentiment analysis and irony detection, and proposing a semi-automated annotation methodology where human expertise is crucial for refining LLMs results, enriched by incorporating historical and cultural contexts as core features."
}
Markdown (Informal)
[Historical Ink: Exploring Large Language Models for Irony Detection in 19th-Century Spanish](https://preview.aclanthology.org/Ingest-2025-COMPUTEL/2025.nlp4dh-1.48/) (Cohen et al., NLP4DH 2025)
ACL