% CroCoSyn corpus paper, LaTeCH-CLfL 2026 workshop proceedings (ACL).
% NOTE(review): the url field points at an Anthology preview host
% (preview.aclanthology.org/ingest-eacl) -- confirm the canonical URL before release.
@inproceedings{escouflaire-2026-crocosyn-cross,
  title     = {{CroCoSyn}: A Cross-Lingual and Cross-Model Corpus of {LLM}-Generated Film Synopses},
  author    = {Escouflaire, Louis},
  editor    = {Alves, Diego and
               Bizzoni, Yuri and
               Degaetano-Ortlieb, Stefania and
               Kazantseva, Anna and
               Pagel, Janis and
               Szpakowicz, Stan},
  booktitle = {Proceedings of the 10th Joint {SIGHUM} Workshop on Computational Linguistics for Cultural Heritage, Social Sciences, Humanities and Literature 2026},
  month     = mar,
  year      = {2026},
  address   = {Rabat, Morocco},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-eacl/2026.latechclfl-1.4/},
  pages     = {30--35},
  isbn      = {979-8-89176-373-9},
  abstract  = {We introduce CroCoSyn, a controlled, cross-lingual and cross-model corpus of 25,920 LLM-generated film synopses in English and French. Each synopsis is generated under systematically varied conditions, including model type, temperature, genre, protagonist gender, and narrative constraints, and enriched with structured metadata capturing characters and their relationships. Comparing Mistral and Llama across different model temperature degrees, CroCoSyn enables fine-grained analysis of narrative content, style, and character representation across models and languages. The corpus supports research on gender and cultural biases and story generation evaluation, and provides a foundation for comparative studies between LLM-generated and human-written narratives.},
}
Markdown (Informal)
[CroCoSyn: A Cross-Lingual and Cross-Model Corpus of LLM-Generated Film Synopses](https://preview.aclanthology.org/ingest-eacl/2026.latechclfl-1.4/) (Escouflaire, LaTeCH-CLfL 2026)
ACL