@inproceedings{torres-futrell-2023-simpler,
title = "Simpler neural networks prefer subregular languages",
author = "Torres, Charles and
Futrell, Richard",
editor = "Bouamor, Houda and
Pino, Juan and
Bali, Kalika",
booktitle = "Findings of the Association for Computational Linguistics: EMNLP 2023",
month = dec,
year = "2023",
address = "Singapore",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/fix-sig-urls/2023.findings-emnlp.112/",
doi = "10.18653/v1/2023.findings-emnlp.112",
pages = "1651--1661",
    abstract = "We apply a continuous relaxation of $L_0$ regularization (Louizos et al., 2017), which induces sparsity, to study the inductive biases of LSTMs. In particular, we are interested in the patterns of formal languages which are readily learned and expressed by LSTMs. Across a wide range of tests we find that sparse LSTMs prefer subregular languages over regular languages, and the strength of this preference increases as we increase the pressure for sparsity. Furthermore, LSTMs trained on subregular languages have fewer non-zero parameters. We conjecture that this subregular bias in LSTMs is related to the cognitive bias for subregular languages observed in human phonology, both of which are downstream of a simplicity bias in a suitable description language."
}
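
For readers unfamiliar with the method named in the abstract, the sketch below illustrates the continuous relaxation of $L_0$ regularization (the hard-concrete gates of Louizos et al., 2017) that the paper applies to LSTMs. It is a minimal PyTorch illustration under common hyperparameter defaults, not the authors' code: the `L0Gate` class, its defaults, and the toy usage are assumptions chosen for brevity.

```python
# Illustrative sketch of hard-concrete L0 gates (Louizos et al., 2017);
# not the paper's implementation.
import math
import torch
import torch.nn as nn
import torch.nn.functional as F


class L0Gate(nn.Module):
    """Hard-concrete gates z in [0, 1] with a differentiable expected-L0 penalty.
    One gate per parameter of the gated tensor."""

    def __init__(self, shape, beta=2.0 / 3.0, gamma=-0.1, zeta=1.1):
        super().__init__()
        self.log_alpha = nn.Parameter(torch.zeros(shape))  # gate location parameters
        self.beta, self.gamma, self.zeta = beta, gamma, zeta

    def forward(self):
        if self.training:
            # Sample a concrete (relaxed Bernoulli) variable, stretch it, then clamp.
            u = torch.rand_like(self.log_alpha).clamp(1e-6, 1 - 1e-6)
            s = torch.sigmoid((u.log() - (1 - u).log() + self.log_alpha) / self.beta)
        else:
            s = torch.sigmoid(self.log_alpha)  # deterministic gates at test time
        s_bar = s * (self.zeta - self.gamma) + self.gamma
        return s_bar.clamp(0.0, 1.0)

    def expected_l0(self):
        # Probability that each gate is non-zero; the sum is the expected L0 norm.
        return torch.sigmoid(
            self.log_alpha - self.beta * math.log(-self.gamma / self.zeta)
        ).sum()


# Toy usage: gate the weights of a single linear map and penalize expected L0.
weight = nn.Parameter(torch.randn(32, 16))
gate = L0Gate(weight.shape)
x = torch.randn(4, 16)
y = F.linear(x, weight * gate())                    # forward pass with gated weights
loss = y.pow(2).mean() + 1e-3 * gate.expected_l0()  # coefficient sets the sparsity pressure
loss.backward()
```

Raising the coefficient on `expected_l0()` corresponds to the "pressure for sparsity" that the abstract says strengthens the subregular preference.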