@comment{NAACL 2025 long paper, ACL Anthology ID 2025.naacl-long.347.
  The url field uses the canonical aclanthology.org address rather than a
  preview-branch build. The acronym and the math in the title are
  brace-protected so styles that sentence-case titles leave them intact.}
@inproceedings{zhang-etal-2025-advancing,
  title     = {Advancing {MoE} Efficiency: A Collaboration-Constrained Routing ({$\texttt{C2R}$}) Strategy for Better Expert Parallelism Design},
  author    = {Zhang, Mohan and
               Li, Pingzhi and
               Peng, Jie and
               Qiu, Mufan and
               Chen, Tianlong},
  editor    = {Chiruzzo, Luis and
               Ritter, Alan and
               Wang, Lu},
  booktitle = {Proceedings of the 2025 Conference of the Nations of the Americas Chapter of the Association for Computational Linguistics: Human Language Technologies (Volume 1: Long Papers)},
  month     = apr,
  year      = {2025},
  address   = {Albuquerque, New Mexico},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.naacl-long.347/},
  pages     = {6815--6825},
  isbn      = {979-8-89176-189-6},
}
Markdown (Informal)
[Advancing MoE Efficiency: A Collaboration-Constrained Routing (C2R) Strategy for Better Expert Parallelism Design](https://aclanthology.org/2025.naacl-long.347/) (Zhang et al., NAACL 2025)
ACL