@inproceedings{van-hautte-etal-2019-bad,
title = "Bad Form: Comparing Context-Based and Form-Based Few-Shot Learning in Distributional Semantic Models",
author = "Van Hautte, Jeroen and
Emerson, Guy and
Rei, Marek",
editor = "Cherry, Colin and
Durrett, Greg and
Foster, George and
Haffari, Reza and
Khadivi, Shahram and
Peng, Nanyun and
Ren, Xiang and
Swayamdipta, Swabha",
booktitle = "Proceedings of the 2nd Workshop on Deep Learning Approaches for Low-Resource NLP (DeepLo 2019)",
month = nov,
year = "2019",
address = "Hong Kong, China",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/jlcl-multiple-ingestion/D19-6104/",
doi = "10.18653/v1/D19-6104",
pages = "31--39",
abstract = "Word embeddings are an essential component in a wide range of natural language processing applications. However, distributional semantic models are known to struggle when only a small number of context sentences are available. Several methods have been proposed to obtain higher-quality vectors for these words, leveraging both this context information and sometimes the word forms themselves through a hybrid approach. We show that the current tasks do not suffice to evaluate models that use word-form information, as such models can easily leverage word forms in the training data that are related to word forms in the test data. We introduce 3 new tasks, allowing for a more balanced comparison between models. Furthermore, we show that hyperparameters that have largely been ignored in previous work can consistently improve the performance of both baseline and advanced models, achieving a new state of the art on 4 out of 6 tasks."
}
Markdown (Informal)
[Bad Form: Comparing Context-Based and Form-Based Few-Shot Learning in Distributional Semantic Models](https://preview.aclanthology.org/jlcl-multiple-ingestion/D19-6104/) (Van Hautte et al., 2019)
ACL