% ML4AL 2024 workshop paper (ACL Anthology record, DOI 10.18653/v1/2024.ml4al-1.6).
% The url field uses the canonical Anthology address rather than a preview-branch host.
% NOTE(review): address carries the event location as exported, not a publisher
% city -- confirm this is what the target bibliography style expects.
@inproceedings{ozaki-etal-2024-long,
  author    = {Ozaki, Hiroaki and Komiya, Kanako and Asahara, Masayuki and Ogiso, Toshinobu},
  title     = {Long Unit Word Tokenization and Bunsetsu Segmentation of Historical {Japanese}},
  editor    = {Pavlopoulos, John and Sommerschield, Thea and Assael, Yannis and Gordin, Shai and Cho, Kyunghyun and Passarotti, Marco and Sprugnoli, Rachele and Liu, Yudong and Li, Bin and Anderson, Adam},
  booktitle = {Proceedings of the 1st Workshop on Machine Learning for Ancient Languages ({ML4AL} 2024)},
  month     = aug,
  year      = {2024},
  address   = {Hybrid in Bangkok, Thailand and online},
  publisher = {Association for Computational Linguistics},
  pages     = {48--55},
  doi       = {10.18653/v1/2024.ml4al-1.6},
  url       = {https://aclanthology.org/2024.ml4al-1.6/},
}