% ACL 2026 main-conference long paper (ACL Anthology ID 2026.acl-long.972).
% - The system name is braced as one whole token so sentence-casing styles keep
%   both the "LLME" prefix and the capital "F" of "Fair".
% - url uses the canonical Anthology host instead of the temporary
%   preview/ingest staging host; NOTE(review): confirm the page resolves once
%   the volume is live.
% - address holds the conference location, following ACL Anthology export
%   convention, not the publisher's city.
@inproceedings{zhang-etal-2026-llmeval,
  author    = {Zhang, Ming and
               Shen, Yujiong and
               Deng, Jingyi and
               Wang, Yuhui and
               Sha, Huayu and
               Tan, Kexin and
               Peng, Qiyuan and
               Zhang, Yue and
               Wang, Junzhe and
               Liu, Shichun and
               Huang, Yueyuan and
               Tong, Jingqi and
               Jiang, Changhao and
               Wu, Yilong and
               Zhang, Zhihao and
               Wu, Mingqi and
               Chai, Mingxu and
               Xi, Zhiheng and
               Dou, Shihan and
               Gui, Tao and
               Zhang, Qi and
               Huang, Xuanjing},
  title     = {{LLMEval-Fair}: A Large-Scale Longitudinal Study on Robust and Fair Evaluation of Large Language Models},
  editor    = {Liakata, Maria and
               Moreira, Viviane P. and
               Zhang, Jiajun and
               Jurgens, David},
  booktitle = {Proceedings of the 64th Annual Meeting of the {Association} for {Computational} {Linguistics} (Volume 1: Long Papers)},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, United States},
  publisher = {Association for Computational Linguistics},
  pages     = {21246--21273},
  isbn      = {979-8-89176-390-6},
  url       = {https://aclanthology.org/2026.acl-long.972/},
}