@inproceedings{huang-etal-2022-reconciliation,
title = "Reconciliation of Pre-trained Models and Prototypical Neural Networks in Few-shot Named Entity Recognition",
author = "Huang, Youcheng and
Lei, Wenqiang and
Fu, Jie and
Lv, Jiancheng",
editor = "Goldberg, Yoav and
Kozareva, Zornitsa and
Zhang, Yue",
booktitle = "Findings of the Association for Computational Linguistics: EMNLP 2022",
month = dec,
year = "2022",
address = "Abu Dhabi, United Arab Emirates",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/fix-sig-urls/2022.findings-emnlp.129/",
doi = "10.18653/v1/2022.findings-emnlp.129",
pages = "1793--1807",
abstract = "Incorporating large-scale pre-trained models with the prototypical neural networks is a de-facto paradigm in few-shot named entity recognition. Existing methods, unfortunately, are not aware of the fact that embeddings from pre-trained models contain a prominently large amount of information regarding word frequencies, biasing prototypical neural networks against learning word entities. This discrepancy constrains the two models' synergy. Thus, we propose a one-line-code normalization method to reconcile such a mismatch with empirical and theoretical grounds. Our experiments based on nine benchmark datasets show the superiority of our method over the counterpart models and are comparable to the state-of-the-art methods. In addition to the model enhancement, our work also provides an analytical viewpoint for addressing the general problems in few-shot name entity recognition or other tasks that rely on pre-trained models or prototypical neural networks."
}