@inproceedings{cho-seo-2025-towards,
title = "Towards Reliable and Practical Phishing Detection",
author = "Cho, Hyowon and
Seo, Minjoon",
editor = "Chen, Weizhu and
Yang, Yi and
Kachuee, Mohammad and
Fu, Xue-Yong",
booktitle = "Proceedings of the 2025 Conference of the Nations of the Americas Chapter of the Association for Computational Linguistics: Human Language Technologies (Volume 3: Industry Track)",
month = apr,
year = "2025",
address = "Albuquerque, New Mexico",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/fix-sig-urls/2025.naacl-industry.18/",
pages = "210--225",
ISBN = "979-8-89176-194-0",
abstract = "As the prevalence of phishing attacks continues to rise, there is an increasing demand for more robust detection technologies. With recent advances in AI, we discuss how to construct a reliable and practical phishing detection system using language models. For this system, we introduce the first large-scale Korean dataset for phishing detection, encompassing six types of phishing attacks. We consider multiple factors for building a real-time detection system for edge devices, such as model size, Speech-To-Text quality, split length, training technique and multi-task learning. We evaluate the model{'}s ability twofold: in-domain, and unseen attack detection performance which is referred to as zero-day performance. Additionally, we demonstrate the importance of accurate comparison groups and evaluation datasets, showing that voice phishing detection performs reasonably well while smishing detection remains challenging. Both the dataset and the trained model will be available upon request."
}
Markdown (Informal)
[Towards Reliable and Practical Phishing Detection](https://preview.aclanthology.org/fix-sig-urls/2025.naacl-industry.18/) (Cho & Seo, NAACL 2025)
ACL
- Hyowon Cho and Minjoon Seo. 2025. Towards Reliable and Practical Phishing Detection. In Proceedings of the 2025 Conference of the Nations of the Americas Chapter of the Association for Computational Linguistics: Human Language Technologies (Volume 3: Industry Track), pages 210–225, Albuquerque, New Mexico. Association for Computational Linguistics.