@inproceedings{clark-etal-2008-toward,
title = "Toward Active Learning in Data Selection: Automatic Discovery of Language Features During Elicitation",
author = "Clark, Jonathan and
Frederking, Robert and
Levin, Lori",
editor = "Calzolari, Nicoletta and
Choukri, Khalid and
Maegaard, Bente and
Mariani, Joseph and
Odijk, Jan and
Piperidis, Stelios and
Tapias, Daniel",
booktitle = "Proceedings of the Sixth International Conference on Language Resources and Evaluation ({LREC}`08)",
month = may,
year = "2008",
address = "Marrakech, Morocco",
publisher = "European Language Resources Association (ELRA)",
url = "https://preview.aclanthology.org/add-emnlp-2024-awards/L08-1059/",
abstract = "Data Selection has emerged as a common issue in language technologies. We define Data Selection as the choosing of a subset of training data that is most effective for a given task. This paper describes deductive feature detection, one component of a data selection system for machine translation. Feature detection determines whether features such as tense, number, and person are expressed in a language. The database of the The World Atlas of Language Structures provides a gold standard against which to evaluate feature detection. The discovered features can be used as input to a Navigator, which uses active learning to determine which piece of language data is the most important to acquire next."
}
Markdown (Informal)
[Toward Active Learning in Data Selection: Automatic Discovery of Language Features During Elicitation](https://preview.aclanthology.org/add-emnlp-2024-awards/L08-1059/) (Clark et al., LREC 2008)
ACL