@inproceedings{phan-chiang-2025-mymy,
title = "{M}y{M}y at {S}em{E}val-2025 Task 9: A Robust Knowledge-Augmented Data Approach for Reliable Food Hazard Detection",
author = "Phan, Ben and
Chiang, Jung-Hsien",
editor = "Rosenthal, Sara and
Ros{\'a}, Aiala and
Ghosh, Debanjan and
Zampieri, Marcos",
booktitle = "Proceedings of the 19th International Workshop on Semantic Evaluation (SemEval-2025)",
month = jul,
year = "2025",
address = "Vienna, Austria",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/tal-24-ingestion/2025.semeval-1.112/",
pages = "812--822",
ISBN = "979-8-89176-273-2",
abstract = "The Food Hazard Detection (SemEval-2025 Task 9) advances explainable classification of food-incident reports collected from web sources, including social media and regulatory agency websites, to support timely risk mitigation for public health and the economy. This task is complicated by a highly imbalanced, long-tail label distribution and the need for transparent, reliable AI. We present a robust Knowledge-Augmented Data approach that integrates Retrieval-Augmented Generation (RAG) with domain-specific knowledge from the PubMed API to enrich and balance the training data. Our method leverages domain-specific knowledge to expand datasets and curate high-quality data that enhances overall data integrity. We hypothesize that Knowledge-Augmented Data improves Macro-F1 scores, the primary evaluation metric. Our approach achieved a top-2 ranking across both subtasks, demonstrating its effectiveness in advancing NLP applications for food safety and contributing to more reliable food hazard detection."
}
Markdown (Informal)
[MyMy at SemEval-2025 Task 9: A Robust Knowledge-Augmented Data Approach for Reliable Food Hazard Detection](https://preview.aclanthology.org/tal-24-ingestion/2025.semeval-1.112/) (Phan & Chiang, SemEval 2025)
ACL