@inproceedings{park-kim-2025-understanding,
title = "Understanding {LLM} Development Through Longitudinal Study: Insights from the Open {K}o-{LLM} Leaderboard",
author = "Park, Chanjun and
Kim, Hyeonwoo",
editor = "Chen, Weizhu and
Yang, Yi and
Kachuee, Mohammad and
Fu, Xue-Yong",
booktitle = "Proceedings of the 2025 Conference of the Nations of the Americas Chapter of the Association for Computational Linguistics: Human Language Technologies (Volume 3: Industry Track)",
month = apr,
year = "2025",
address = "Albuquerque, New Mexico",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/fix-sig-urls/2025.naacl-industry.1/",
pages = "1--8",
ISBN = "979-8-89176-194-0",
abstract = "This paper conducts a longitudinal study over eleven months to address the limitations of prior research on the Open Ko-LLM Leaderboard, which have relied on empirical studies with restricted observation periods of only five months. By extending the analysis duration, we aim to provide a more comprehensive understanding of the progression in developing Korean large language models (LLMs). Our study is guided by three primary research questions: (1) What are the specific challenges in improving LLM performance across diverse tasks on the Open Ko-LLM Leaderboard over time? (2) How does model size impact task performance correlations across various benchmarks? (3) How have the patterns in leaderboard rankings shifted over time on the Open Ko-LLM Leaderboard?. By analyzing 1,769 models over this period, our research offers a comprehensive examination of the ongoing advancements in LLMs and the evolving nature of evaluation frameworks."
}
Markdown (Informal)
[Understanding LLM Development Through Longitudinal Study: Insights from the Open Ko-LLM Leaderboard](https://preview.aclanthology.org/fix-sig-urls/2025.naacl-industry.1/) (Park & Kim, NAACL 2025)
ACL