% INLG 2025 conference paper; ACL Anthology ID 2025.inlg-main.30.
% The url field uses the permanent Anthology address rather than a staging preview branch.
@inproceedings{rodriguez-mendoza-2025-logitrouter,
    title = {{LogitRouter}: a novel Attention variant for reducing Myopic Routing in Mixture of Experts},
    author = {Rodriguez, Felipe and
        Mendoza, Marcelo},
    editor = {Flek, Lucie and
        Narayan, Shashi and
        Phương, Lê Hồng and
        Pei, Jiahuan},
    booktitle = {Proceedings of the 18th International Natural Language Generation Conference},
    month = oct,
    year = {2025},
    address = {Hanoi, Vietnam},
    publisher = {Association for Computational Linguistics},
    url = {https://aclanthology.org/2025.inlg-main.30/},
    pages = {499--510},
    abstract = {Mixture of Experts (MoEs) have emerged as strong alternatives to traditional transformers, offering significant advantages in terms of training and inference efficiency. At the core of this architecture lies the router, responsible for selecting which experts are activated for each token. However, despite these advances, routing mechanisms continue to face stability challenges that the basic architecture fails to fully address. One such issue is Myopic Routing, where each token determines its route independently, without considering the routing decisions made for other tokens. To address this limitation, the LogitAttention mechanism is introduced{---}a variant of traditional attention{---}and, building upon it, the LogitRouter, a novel routing architecture that incorporates contextual information about the routing of other tokens. Due to budget constraints, a set of simple experiments is designed to obtain preliminary evidence of performance trends. These experiments are empirically validated on established benchmarks such as BoolQ, MMLU, and ARC. Finally, the work concludes with an in-depth discussion of architectural variants, applicability, limitations, and future directions, which aims to support continued research in this area.},
}
Markdown (Informal)
[LogitRouter: a novel Attention variant for reducing Myopic Routing in Mixture of Experts](https://aclanthology.org/2025.inlg-main.30/) (Rodriguez & Mendoza, INLG 2025)
ACL