@inproceedings{kwon-etal-2025-logicqa,
title = "{L}ogic{QA}: Logical Anomaly Detection with Vision Language Model Generated Questions",
author = "Kwon, Yejin and
Moon, Daeun and
Oh, Youngje and
Yoon, Hyunsoo",
editor = "Rehm, Georg and
Li, Yunyao",
booktitle = "Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 6: Industry Track)",
month = jul,
year = "2025",
address = "Vienna, Austria",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/landing_page/2025.acl-industry.29/",
pages = "411--432",
ISBN = "979-8-89176-288-6",
abstract = "Anomaly Detection (AD) focuses on detecting samples that differ from the standard pattern, making it a vital tool in process control. Logical anomalies may appear visually normal yet violate predefined constraints on object presence, arrangement, or quantity, depending on reasoning and explainability. We introduce LogicQA, a framework that enhances AD by providing industrial operators with explanations for logical anomalies. LogicQA compiles automatically generated questions into a checklist and collects responses to identify violations of logical constraints. LogicQA is training-free, annotation-free, and operates in a few-shot setting. We achieve state-of-the-art (SOTA) Logical AD performance on public benchmarks, MVTec LOCO AD, with an AUROC of 87.6{\%} and an $F_1$-max of 87.0{\%} along with the explanations of anomalies. Also, our approach has shown outstanding performance on semiconductor SEM corporate data, further validating its effectiveness in industrial applications."
}
Markdown (Informal)
[LogicQA: Logical Anomaly Detection with Vision Language Model Generated Questions](https://preview.aclanthology.org/landing_page/2025.acl-industry.29/) (Kwon et al., ACL 2025)
ACL