% Conference paper from the Twelfth Language Resources and Evaluation
% Conference (2020) on a general second-order RNN for language modeling.
% The url field uses the canonical ACL Anthology address, not a preview branch.
@inproceedings{maupome-meurs-2020-language,
  title     = {Language Modeling with a General Second-Order {RNN}},
  author    = {Maupom{\'e}, Diego and
               Meurs, Marie-Jean},
  editor    = {Calzolari, Nicoletta and
               B{\'e}chet, Fr{\'e}d{\'e}ric and
               Blache, Philippe and
               Choukri, Khalid and
               Cieri, Christopher and
               Declerck, Thierry and
               Goggi, Sara and
               Isahara, Hitoshi and
               Maegaard, Bente and
               Mariani, Joseph and
               Mazo, H{\'e}l{\`e}ne and
               Moreno, Asuncion and
               Odijk, Jan and
               Piperidis, Stelios},
  booktitle = {Proceedings of the Twelfth Language Resources and Evaluation Conference},
  month     = may,
  year      = {2020},
  address   = {Marseille, France},
  publisher = {European Language Resources Association},
  url       = {https://aclanthology.org/2020.lrec-1.584/},
  pages     = {4749--4753},
  language  = {eng},
  isbn      = {979-10-95546-34-4},
  abstract  = {Different Recurrent Neural Network (RNN) architectures update their state in different manners as the input sequence is processed. RNNs including a multiplicative interaction between their current state and the current input, second-order ones, show promising performance in language modeling. In this paper, we introduce a second-order RNN that generalizes existing ones. Evaluating on the Penn Treebank dataset, we analyze how its different components affect its performance in character-level recurrent language modeling. We perform our experiments controlling the parameter counts of models. We find that removing the first-order terms does not hinder performance. We perform further experiments comparing the effects of the relative size of the state space and the multiplicative interaction space on performance. Our expectation was that larger states would benefit language models built on longer documents, and larger multiplicative interaction states would benefit ones built on larger input spaces. However, our results suggest that this is not the case and the optimal relative size is the same for both document tokenizations used.},
}
Markdown (Informal)
[Language Modeling with a General Second-Order RNN](https://aclanthology.org/2020.lrec-1.584/) (Maupomé & Meurs, LREC 2020)
ACL
- Diego Maupomé and Marie-Jean Meurs. 2020. Language Modeling with a General Second-Order RNN. In Proceedings of the Twelfth Language Resources and Evaluation Conference, pages 4749–4753, Marseille, France. European Language Resources Association.