% Conference paper from the ICNLSP-2025 proceedings (ACL Anthology ID 2025.icnlsp-1.24).
% The url field holds the canonical Anthology address rather than a temporary
% preview-branch build, and the model names in the title are brace-protected as
% whole words so sentence-casing styles keep their capitalisation.
@inproceedings{dang-etal-2025-tokenization,
    title = "Tokenization and Morphology in Multilingual Language Models: A Comparative Analysis of {mT5} and {ByT5}",
    author = "Dang, Thao Anh and
      Raviv, Limor and
      Galke, Lukas",
    editor = "Abbas, Mourad and
      Yousef, Tariq and
      Galke, Lukas",
    booktitle = "Proceedings of the 8th International Conference on Natural Language and Speech Processing (ICNLSP-2025)",
    month = aug,
    year = "2025",
    address = "Southern Denmark University, Odense, Denmark",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.icnlsp-1.24/",
    pages = "242--257"
}
Markdown (Informal)
[Tokenization and Morphology in Multilingual Language Models: A Comparative Analysis of mT5 and ByT5](https://aclanthology.org/2025.icnlsp-1.24/) (Dang et al., ICNLSP 2025)
ACL