@inproceedings{takase-etal-2018-direct,
title = "Direct Output Connection for a High-Rank Language Model",
author = "Takase, Sho and
Suzuki, Jun and
Nagata, Masaaki",
editor = "Riloff, Ellen and
Chiang, David and
Hockenmaier, Julia and
Tsujii, Jun{'}ichi",
booktitle = "Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing",
month = oct # "-" # nov,
year = "2018",
address = "Brussels, Belgium",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/jlcl-multiple-ingestion/D18-1489/",
doi = "10.18653/v1/D18-1489",
pages = "4599--4609",
abstract = "This paper proposes a state-of-the-art recurrent neural network (RNN) language model that combines probability distributions computed not only from a final RNN layer but also middle layers. This method raises the expressive power of a language model based on the matrix factorization interpretation of language modeling introduced by Yang et al. (2018). Our proposed method improves the current state-of-the-art language model and achieves the best score on the Penn Treebank and WikiText-2, which are the standard benchmark datasets. Moreover, we indicate our proposed method contributes to application tasks: machine translation and headline generation."
}
Markdown (Informal)
[Direct Output Connection for a High-Rank Language Model](https://preview.aclanthology.org/jlcl-multiple-ingestion/D18-1489/) (Takase et al., EMNLP 2018)
ACL
- Sho Takase, Jun Suzuki, and Masaaki Nagata. 2018. Direct Output Connection for a High-Rank Language Model. In Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing, pages 4599–4609, Brussels, Belgium. Association for Computational Linguistics.