@inproceedings{liu-etal-2026-temporal-tokenization,
title = "Temporal Tokenization Strategies for Event Sequence Modeling with Large Language Models",
author = "Liu, Zefang and
Nguyen, Nam H and
Quan, Yinzhu and
Zhang, Shi-Xiong",
editor = "Mille, Simon and
Gehrmann, Sebastian and
Schmidtov{\'a}, Patr{\'i}cia and
Du{\v{s}}ek, Ond{\v{r}}ej and
Fadaee, Marzieh and
Lo, Kyle and
Santus, Enrico and
Stanovsky, Gabriel",
booktitle = "Proceedings of the Fifth Workshop on Generation, Evaluation and Metrics ({GEM})",
month = jul,
year = "2026",
address = "San Diego, California, USA",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-acl-workshops/2026.gem-main.5/",
pages = "41--51",
ISBN = "979-8-89176-423-1",
abstract = "Representing continuous time is a critical and under-explored challenge in modeling temporal event sequences with large language models (LLMs). Various strategies like byte-level representations or calendar tokens have been proposed. However, the optimal approach remains unclear, especially given the diverse statistical distributions of real-world event data, which range from smooth log-normal to discrete, spiky patterns. This paper presents a systematic empirical study of temporal tokenization for modeling event sequences with LLMs, comparing distinct encoding strategies: naive numeric strings, high-precision byte-level representations, human-semantic calendar tokens, classic uniform binning, and adaptive residual scalar quantization. We evaluate these strategies by fine-tuning LLMs on real-world datasets that exemplify these diverse distributions. Our analysis reveals that no single strategy is universally superior; instead, prediction performance depends heavily on aligning the tokenizer with the data{'}s statistical properties, highlighting temporal tokenization as a critical yet often overlooked design dimension in LLM-based event modeling."
}Markdown (Informal)
[Temporal Tokenization Strategies for Event Sequence Modeling with Large Language Models](https://preview.aclanthology.org/ingest-acl-workshops/2026.gem-main.5/) (Liu et al., GEM 2026)
ACL