@inproceedings{tefnik-kadlcik-2023-context,
title = "Can In-context Learners Learn a Reasoning Concept from Demonstrations?",
author = "{\v{S}}tef{\'a}nik, Michal and
Kadl{\v{c}}{\'i}k, Marek",
editor = "Dalvi Mishra, Bhavana and
Durrett, Greg and
Jansen, Peter and
Neves Ribeiro, Danilo and
Wei, Jason",
booktitle = "Proceedings of the 1st Workshop on Natural Language Reasoning and Structured Explanations (NLRSE)",
month = jun,
year = "2023",
address = "Toronto, Canada",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/jlcl-multiple-ingestion/2023.nlrse-1.8/",
doi = "10.18653/v1/2023.nlrse-1.8",
pages = "107--115",
abstract = "Large language models show an emergent ability to learn a new task from a small number of input-output demonstrations. However, recent work shows that in-context learners largely rely on their pre-trained knowledge, such as the sentiment of the labels, instead of finding new associations in the input. However, the commonly-used few-shot evaluation settings using a random selection of in-context demonstrations can not disentangle models' ability to learn a new skill from demonstrations, as most of the randomly-selected demonstrations do not present relations informative for prediction beyond exposing the new task distribution. To disentangle models' in-context learning ability independent of models' memory, we introduce a Conceptual few-shot learning method selecting the demonstrations sharing a possibly-informative concept with the predicted sample. We extract a set of such concepts from annotated explanations and measure how much can models benefit from presenting these concepts in few-shot demonstrations. We find that smaller models are more sensitive to the presented concepts. While some of the models are able to benefit from concept-presenting demonstrations for each assessed concept, we find that none of the assessed in-context learners can benefit from all presented reasoning concepts consistently, leaving the in-context concept learning an open challenge."
}
Markdown (Informal)
[Can In-context Learners Learn a Reasoning Concept from Demonstrations?](https://preview.aclanthology.org/jlcl-multiple-ingestion/2023.nlrse-1.8/) (Štefánik & Kadlčík, NLRSE 2023)
ACL