@inproceedings{white-etal-2021-non,
title = "A Non-Linear Structural Probe",
author = "White, Jennifer C. and
Pimentel, Tiago and
Saphra, Naomi and
Cotterell, Ryan",
editor = "Toutanova, Kristina and
Rumshisky, Anna and
Zettlemoyer, Luke and
Hakkani-Tur, Dilek and
Beltagy, Iz and
Bethard, Steven and
Cotterell, Ryan and
Chakraborty, Tanmoy and
Zhou, Yichao",
booktitle = "Proceedings of the 2021 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies",
month = jun,
year = "2021",
address = "Online",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/jlcl-multiple-ingestion/2021.naacl-main.12/",
doi = "10.18653/v1/2021.naacl-main.12",
pages = "132--138",
abstract = "Probes are models devised to investigate the encoding of knowledge{---}e.g. syntactic structure{---}in contextual representations. Probes are often designed for simplicity, which has led to restrictions on probe design that may not allow for the full exploitation of the structure of encoded information; one such restriction is linearity. We examine the case of a structural probe (Hewitt and Manning, 2019), which aims to investigate the encoding of syntactic structure in contextual representations through learning only linear transformations. By observing that the structural probe learns a metric, we are able to kernelize it and develop a novel non-linear variant with an identical number of parameters. We test on 6 languages and find that the radial-basis function (RBF) kernel, in conjunction with regularization, achieves a statistically significant improvement over the baseline in all languages{---}implying that at least part of the syntactic knowledge is encoded non-linearly. We conclude by discussing how the RBF kernel resembles BERT`s self-attention layers and speculate that this resemblance leads to the RBF-based probe`s stronger performance."
}
Markdown (Informal)
[A Non-Linear Structural Probe](https://preview.aclanthology.org/jlcl-multiple-ingestion/2021.naacl-main.12/) (White et al., NAACL 2021)
ACL
- Jennifer C. White, Tiago Pimentel, Naomi Saphra, and Ryan Cotterell. 2021. A Non-Linear Structural Probe. In Proceedings of the 2021 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, pages 132–138, Online. Association for Computational Linguistics.