@comment{ACL Anthology record L06-1059 (LREC 2006 paper). The url field uses the canonical aclanthology.org address instead of a temporary preview-branch deployment.}
@inproceedings{wandmacher-antoine-2006-training,
  title     = {Training Language Models without Appropriate Language Resources: Experiments with an {AAC} System for Disabled People},
  author    = {Wandmacher, Tonio and
               Antoine, Jean-Yves},
  editor    = {Calzolari, Nicoletta and
               Choukri, Khalid and
               Gangemi, Aldo and
               Maegaard, Bente and
               Mariani, Joseph and
               Odijk, Jan and
               Tapias, Daniel},
  booktitle = {Proceedings of the Fifth International Conference on Language Resources and Evaluation ({LREC}{'}06)},
  month     = may,
  year      = {2006},
  address   = {Genoa, Italy},
  publisher = {European Language Resources Association ({ELRA})},
  url       = {https://aclanthology.org/L06-1059/},
  abstract  = {Statistical Language Models (LM) are highly dependent on their training resources. This makes it not only difficult to interpret evaluation results, it also has a deteriorating effect on the use of an LM-based application. This question has already been studied by others. Considering a specific domain (text prediction in a communication aid for handicapped people) we want to address the problem from a different point of view: the influence of the language register. Considering corpora from five different registers, we want to discuss three methods to adapt a language model to its actual language resource ultimately reducing the effect of training dependency: (a) A simple cache model augmenting the probability of the n last inserted words; (b) a user dictionary, keeping every unseen word; and (c) a combined LM interpolating a base model with a dynamically updated user model. Our evaluation is based on the results obtained from a text prediction system working on a trigram LM.},
}
Markdown (Informal)
[Training Language Models without Appropriate Language Resources: Experiments with an AAC System for Disabled People](https://aclanthology.org/L06-1059/) (Wandmacher & Antoine, LREC 2006)
ACL