@inproceedings{park-kim-2025-evaluating,
title = "Evaluating Multimodal Generative {AI} with {K}orean Educational Standards",
author = "Park, Sanghee and
Kim, Geewook",
editor = "Chiruzzo, Luis and
Ritter, Alan and
Wang, Lu",
booktitle = "Proceedings of the 2025 Conference of the Nations of the Americas Chapter of the Association for Computational Linguistics: Human Language Technologies (Volume 2: Short Papers)",
month = apr,
year = "2025",
address = "Albuquerque, New Mexico",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/Ingest-2025-COMPUTEL/2025.naacl-short.56/",
pages = "671--688",
ISBN = "979-8-89176-190-2",
abstract = "This paper presents the Korean National Educational Test Benchmark (KoNET), a new benchmark designed to evaluate Multimodal Generative AI Systems using Korean national educational tests. KoNET comprises four exams: the Korean Elementary General Educational Development Test (KoEGED), Middle (KoMGED), High (KoHGED), and College Scholastic Ability Test (KoCSAT). These exams are renowned for their rigorous standards and diverse questions, facilitating a comprehensive analysis of AI performance across different educational levels. By focusing on Korean, KoNET provides insights into model performance in less-explored languages. We assess a range of models{---}open-source, open-access, and closed APIs{---}by examining difficulties, subject diversity, and human error rates. The code and dataset builder will be made fully open-source."
}
Markdown (Informal)
[Evaluating Multimodal Generative AI with Korean Educational Standards](https://preview.aclanthology.org/Ingest-2025-COMPUTEL/2025.naacl-short.56/) (Park & Kim, NAACL 2025)
ACL
- Sanghee Park and Geewook Kim. 2025. Evaluating Multimodal Generative AI with Korean Educational Standards. In Proceedings of the 2025 Conference of the Nations of the Americas Chapter of the Association for Computational Linguistics: Human Language Technologies (Volume 2: Short Papers), pages 671–688, Albuquerque, New Mexico. Association for Computational Linguistics.