% FlexDoc paper, EMNLP 2025 Industry Track proceedings (pp. 1500--1521).
% The url field uses the canonical ACL Anthology address for paper ID
% 2025.emnlp-industry.105 instead of the temporary preview/ingest mirror.
@inproceedings{dua-etal-2025-flexdoc,
  author    = {Dua, Karan and
               Patel, Hitesh Laxmichand and
               Mittal, Puneet and
               Gupta, Ranjeet and
               Agarwal, Amit and
               Pabolu, Praneet and
               Panda, Srikant and
               Meghwani, Hansa and
               Horwood, Graham and
               Shah, Fahad},
  title     = {{FlexDoc}: Parameterized Sampling for Diverse Multilingual Synthetic Documents for Training Document Understanding Models},
  editor    = {Potdar, Saloni and
               Rojas-Barahona, Lina and
               Montella, Sebastien},
  booktitle = {Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing: Industry Track},
  month     = nov,
  year      = {2025},
  address   = {Suzhou (China)},
  publisher = {Association for Computational Linguistics},
  pages     = {1500--1521},
  isbn      = {979-8-89176-333-3},
  url       = {https://aclanthology.org/2025.emnlp-industry.105/},
}