% Findings of ACL 2026 paper presenting mPresenter (multilingual Paper2Video system)
% and the mPreBench benchmark, as described in the abstract field below.
@inproceedings{han-etal-2026-mpresenter,
  title     = {{mPresenter}: An Agentic Framework for Generating Multilingual Presentation Videos from Scientific Papers},
  author    = {Han, Wenhan and
               Xiao, Xiao and
               Pechenizkiy, Mykola and
               Fang, Meng},
  editor    = {Liakata, Maria and
               Moreira, Viviane P. and
               Zhang, Jiajun and
               Jurgens, David},
  booktitle = {Findings of the {A}ssociation for {C}omputational {L}inguistics: {ACL} 2026},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, United States},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-acl-workshops/2026.findings-acl.805/},
  pages     = {16358--16371},
  isbn      = {979-8-89176-395-1},
  abstract  = {Generating presentation videos from scientific papers is challenging due to the need for long-document discourse planning and cross-lingual grounding. Existing Paper2Video systems are largely monolingual and often rely on single-pass pipelines, which can limit the coherence and informativeness of the resulting presentations. We present mPresenter, a multilingual agentic Paper2Video system that decomposes the task into planning, audience-oriented critique, layout-aware slide generation, and multilingual figure interpretation, enabling iterative refinement at the discourse level. To facilitate reproducible evaluation, we also introduce mPreBench, a multilingual benchmark that evaluates presentation videos via question answering as a proxy for effective information transfer. Experimental results indicate that mPresenter improves question-answering accuracy relative to prior systems, while maintaining affordable cost and latency.},
}

Markdown (Informal)
[mPresenter: An Agentic Framework for Generating Multilingual Presentation Videos from Scientific Papers](https://preview.aclanthology.org/ingest-acl-workshops/2026.findings-acl.805/) (Han et al., Findings 2026)
ACL