@inproceedings{keyaki-keyaki-2024-coarse,
title = "Coarse-Tuning for Ad-hoc Document Retrieval Using Pre-trained Language Models",
author = "Keyaki, Atsushi and
Keyaki, Ribeka",
editor = "Calzolari, Nicoletta and
Kan, Min-Yen and
Hoste, Veronique and
Lenci, Alessandro and
Sakti, Sakriani and
Xue, Nianwen",
booktitle = "Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024)",
month = may,
year = "2024",
address = "Torino, Italia",
publisher = "ELRA and ICCL",
url = "https://preview.aclanthology.org/fix-sig-urls/2024.lrec-main.303/",
pages = "3413--3421",
abstract = "Fine-tuning in information retrieval systems using pre-trained language models (PLM-based IR) requires learning query representations and query-document relations, in addition to downstream task-specific learning. This study introduces coarse-tuning as an intermediate learning stage that bridges pre-training and fine-tuning. By learning query representations and query-document relations in coarse-tuning, we aim to reduce the load of fine-tuning and improve the learning effect of downstream IR tasks. We propose Query-Document Pair Prediction (QDPP) for coarse-tuning, which predicts the appropriateness of query-document pairs. Evaluation experiments show that the proposed method significantly improves MRR and/or nDCG@5 in four ad-hoc document retrieval datasets. Furthermore, the results of the query prediction task suggested that coarse-tuning facilitated learning of query representation and query-document relations."
}
Markdown (Informal)
[Coarse-Tuning for Ad-hoc Document Retrieval Using Pre-trained Language Models](https://preview.aclanthology.org/fix-sig-urls/2024.lrec-main.303/) (Keyaki & Keyaki, LREC-COLING 2024)
ACL