% LREC 2012 paper on a phonemic corpus of Polish child-directed speech (ACL Anthology ID L12-1660).
@inproceedings{boruta-jastrzebska-2012-phonemic,
  title     = {A Phonemic Corpus of {Polish} Child-Directed Speech},
  author    = {Boruta, Luc and
               Jastrzebska, Justyna},
  editor    = {Calzolari, Nicoletta and
               Choukri, Khalid and
               Declerck, Thierry and
               Do{\u{g}}an, Mehmet U{\u{g}}ur and
               Maegaard, Bente and
               Mariani, Joseph and
               Moreno, Asuncion and
               Odijk, Jan and
               Piperidis, Stelios},
  booktitle = {Proceedings of the Eighth International Conference on Language Resources and Evaluation ({LREC}'12)},
  month     = may,
  year      = {2012},
  address   = {Istanbul, Turkey},
  publisher = {European Language Resources Association (ELRA)},
  url       = {https://aclanthology.org/L12-1660/},
  pages     = {1017--1020},
  abstract  = {Recent advances in modeling early language acquisition are due not only to the development of machine-learning techniques, but also to the increasing availability of data on child language and child-adult interaction. In the absence of recordings of child-directed speech, or when models explicitly require such a representation for training data, phonemic transcriptions are commonly used as input data. We present a novel (and to our knowledge, the first) phonemic corpus of Polish child-directed speech. It is derived from the Weist corpus of Polish, freely available from the seminal CHILDES database. For the sake of reproducibility, and to exemplify the typical trade-off between ecological validity and sample size, we report all preprocessing operations and transcription guidelines. Contributed linguistic resources include updated CHAT-formatted transcripts with phonemic transcriptions in a novel phonology tier, as well as by-product data, such as a phonemic lexicon of Polish. All resources are distributed under the LGPL-LR license.},
}
Markdown (Informal)
[A Phonemic Corpus of Polish Child-Directed Speech](https://aclanthology.org/L12-1660/) (Boruta & Jastrzebska, LREC 2012)
ACL
- Luc Boruta and Justyna Jastrzebska. 2012. A Phonemic Corpus of Polish Child-Directed Speech. In Proceedings of the Eighth International Conference on Language Resources and Evaluation (LREC'12), pages 1017–1020, Istanbul, Turkey. European Language Resources Association (ELRA).