% Wu, Ahmad, Dev and Chang: Findings of EMNLP 2022 paper on keyphrase generation.
% The url field holds the permanent ACL Anthology address (not a preview/staging host);
% the doi field holds the bare DOI without a resolver prefix.
@inproceedings{wu-etal-2022-representation,
  title     = {Representation Learning for Resource-Constrained Keyphrase Generation},
  author    = {Wu, Di and
               Ahmad, Wasi and
               Dev, Sunipa and
               Chang, Kai-Wei},
  editor    = {Goldberg, Yoav and
               Kozareva, Zornitsa and
               Zhang, Yue},
  booktitle = {Findings of the Association for Computational Linguistics: {EMNLP} 2022},
  month     = dec,
  year      = 2022,
  address   = {Abu Dhabi, United Arab Emirates},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2022.findings-emnlp.49/},
  doi       = {10.18653/v1/2022.findings-emnlp.49},
  pages     = {700--716},
  abstract  = {State-of-the-art keyphrase generation methods generally depend on large annotated datasets, limiting their performance in domains with limited annotated data. To overcome this challenge, we design a data-oriented approach that first identifies salient information using retrieval-based corpus-level statistics, and then learns a task-specific intermediate representation based on a pre-trained language model using large-scale unlabeled documents. We introduce salient span recovery and salient span prediction as denoising training objectives that condense the intra-article and inter-article knowledge essential for keyphrase generation. Through experiments on multiple keyphrase generation benchmarks, we show the effectiveness of the proposed approach for facilitating low-resource keyphrase generation and zero-shot domain adaptation. Our method especially benefits the generation of absent keyphrases, approaching the performance of models trained with large training sets.},
}
Markdown (Informal)
[Representation Learning for Resource-Constrained Keyphrase Generation](https://aclanthology.org/2022.findings-emnlp.49/) (Wu et al., Findings 2022)
ACL