@inproceedings{sternik-etal-2026-using,
title = "Using k-Shot Prompting with Large k for the Automated Scoring of a {G}erman Written Elicited Imitation Test",
author = "Sternik, Malte and
Laarmann-Quante, Ronja and
Drackert, Anastasia",
editor = "Kochmar, Ekaterina and
Alhafni, Bashar and
Bann{\`o}, Stefano and
Bexte, Marie and
Burstein, Jill and
Horbach, Andrea and
Laarmann-Quante, Ronja and
Tack, Anais and
Yaneva, Victoria and
Yuan, Zheng",
booktitle = "Proceedings of the 21st Workshop on Innovative Use of {NLP} for Building Educational Applications ({BEA} 2026)",
month = jul,
year = "2026",
address = "San Diego, California, USA",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-acl-workshops/2026.bea-1.20/",
pages = "272--280",
ISBN = "979-8-89176-409-5",
abstract = "This paper explores the application of a Large Language Model (LLM) using k-shot prompting with large k for automatically scoring a German Written Elicited Imitation Test (WEIT), a test for assessing literacy-dependent procedural knowledge in German as a foreign language. In this test, test-takers are briefly presented with written sentences which they then have to reproduce in writing as accurately as possible. The responses are scored on an ordinal scale which differentiates between different types of errors (e.g. lexical vs. grammatical). We find that with increasing k (in a range from 1 to 700) accuracy increases significantly but it also depends on the drawn sample and varies across different runs of the same prompt. Overall, the k-shot setting which relies on in-context learning without being provided with the scoring rubric outperforms a baseline where only the scoring rubric is provided to the model. However, the LLM does not outperform previous results based on rule-based or BERT-based models."
}Markdown (Informal)
[Using k-Shot Prompting with Large k for the Automated Scoring of a German Written Elicited Imitation Test](https://preview.aclanthology.org/ingest-acl-workshops/2026.bea-1.20/) (Sternik et al., BEA 2026)
ACL