% EMNLP 2025 main-conference paper, ACL Anthology ID 2025.emnlp-main.1044.
% The url field uses the permanent Anthology address rather than the
% temporary ingest-preview build the entry was originally exported from.
% {Post-Soviet} is brace-protected so sentence-casing styles keep its capitals.
@inproceedings{lavrouk-etal-2025-foundation,
  title     = {What are Foundation Models Cooking in the {Post-Soviet} World?},
  author    = {Lavrouk, Anton and
               Naous, Tarek and
               Ritter, Alan and
               Xu, Wei},
  editor    = {Christodoulopoulos, Christos and
               Chakraborty, Tanmoy and
               Rose, Carolyn and
               Peng, Violet},
  booktitle = {Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing},
  month     = nov,
  year      = {2025},
  address   = {Suzhou, China},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.emnlp-main.1044/},
  pages     = {20698--20720},
  isbn      = {979-8-89176-332-6},
  abstract  = {The culture of the Post-Soviet states is complex, shaped by a turbulent history that continues to influence current events. In this study, we investigate the Post-Soviet cultural food knowledge of foundation models by constructing BORSch, a multi-modal dataset encompassing 1147 and 823 dishes in the Russian and Ukrainian languages, centered around the Post-Soviet region. We demonstrate that leading models struggle to correctly identify the origins of dishes from Post-Soviet nations in both text-only and multi-modal Question Answering (QA), instead over-predicting countries linked to the language the question is asked in. Through analysis of pre-training data, we show that these results can be explained by misleading dish-origin co-occurrences, along with linguistic phenomena such as Russian-Ukrainian code mixing. Finally, to move beyond QA-based assessments, we test models' abilities to produce accurate visual descriptions of dishes. The weak correlation between this task and QA suggests that QA alone may be insufficient as an evaluation of cultural understanding.},
}
Markdown (Informal)
[What are Foundation Models Cooking in the Post-Soviet World?](https://aclanthology.org/2025.emnlp-main.1044/) (Lavrouk et al., EMNLP 2025)
ACL