@inproceedings{sikveland-etal-2010-spontal,
title = "Spontal-N: A Corpus of Interactional Spoken {N}orwegian",
author = {Sikveland, Rein Ove and
{\"O}ttl, Anton and
Amdal, Ingunn and
Ernestus, Mirjam and
Svendsen, Torbj{\o}rn and
Edlund, Jens},
booktitle = "Proceedings of the Seventh International Conference on Language Resources and Evaluation ({LREC}'10)",
month = may,
year = "2010",
address = "Valletta, Malta",
publisher = "European Language Resources Association (ELRA)",
url = "http://www.lrec-conf.org/proceedings/lrec2010/pdf/314_Paper.pdf",
abstract = "Spontal-N is a corpus of spontaneous, interactional Norwegian. To our knowledge, it is the first corpus of Norwegian in which the majority of speakers have spent significant parts of their lives in Sweden, and in which the recorded speech displays varying degrees of interference from Swedish. The corpus consists of studio quality audio- and video-recordings of four 30-minute free conversations between acquaintances, and a manual orthographic transcription of the entire material. On basis of the orthographic transcriptions, we automatically annotated approximately 50 percent of the material on the phoneme level, by means of a forced alignment between the acoustic signal and pronunciations listed in a dictionary. Approximately seven percent of the automatic transcription was manually corrected. Taking the manual correction as a gold standard, we evaluated several sources of pronunciation variants for the automatic transcription. Spontal-N is intended as a general purpose speech resource that is also suitable for investigating phonetic detail.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="sikveland-etal-2010-spontal">
<titleInfo>
<title>Spontal-N: A Corpus of Interactional Spoken Norwegian</title>
</titleInfo>
<name type="personal">
<namePart type="given">Rein</namePart>
<namePart type="given">Ove</namePart>
<namePart type="family">Sikveland</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Anton</namePart>
<namePart type="family">Öttl</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Ingunn</namePart>
<namePart type="family">Amdal</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Mirjam</namePart>
<namePart type="family">Ernestus</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Torbjørn</namePart>
<namePart type="family">Svendsen</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Jens</namePart>
<namePart type="family">Edlund</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2010-may</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the Seventh International Conference on Language Resources and Evaluation (LREC’10)</title>
</titleInfo>
<originInfo>
<publisher>European Language Resources Association (ELRA)</publisher>
<place>
<placeTerm type="text">Valletta, Malta</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>Spontal-N is a corpus of spontaneous, interactional Norwegian. To our knowledge, it is the first corpus of Norwegian in which the majority of speakers have spent significant parts of their lives in Sweden, and in which the recorded speech displays varying degrees of interference from Swedish. The corpus consists of studio quality audio- and video-recordings of four 30-minute free conversations between acquaintances, and a manual orthographic transcription of the entire material. On basis of the orthographic transcriptions, we automatically annotated approximately 50 percent of the material on the phoneme level, by means of a forced alignment between the acoustic signal and pronunciations listed in a dictionary. Approximately seven percent of the automatic transcription was manually corrected. Taking the manual correction as a gold standard, we evaluated several sources of pronunciation variants for the automatic transcription. Spontal-N is intended as a general purpose speech resource that is also suitable for investigating phonetic detail.</abstract>
<identifier type="citekey">sikveland-etal-2010-spontal</identifier>
<location>
<url>http://www.lrec-conf.org/proceedings/lrec2010/pdf/314_Paper.pdf</url>
</location>
<part>
<date>2010-may</date>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Spontal-N: A Corpus of Interactional Spoken Norwegian
%A Sikveland, Rein Ove
%A Öttl, Anton
%A Amdal, Ingunn
%A Ernestus, Mirjam
%A Svendsen, Torbjørn
%A Edlund, Jens
%S Proceedings of the Seventh International Conference on Language Resources and Evaluation (LREC’10)
%D 2010
%8 may
%I European Language Resources Association (ELRA)
%C Valletta, Malta
%F sikveland-etal-2010-spontal
%X Spontal-N is a corpus of spontaneous, interactional Norwegian. To our knowledge, it is the first corpus of Norwegian in which the majority of speakers have spent significant parts of their lives in Sweden, and in which the recorded speech displays varying degrees of interference from Swedish. The corpus consists of studio quality audio- and video-recordings of four 30-minute free conversations between acquaintances, and a manual orthographic transcription of the entire material. On basis of the orthographic transcriptions, we automatically annotated approximately 50 percent of the material on the phoneme level, by means of a forced alignment between the acoustic signal and pronunciations listed in a dictionary. Approximately seven percent of the automatic transcription was manually corrected. Taking the manual correction as a gold standard, we evaluated several sources of pronunciation variants for the automatic transcription. Spontal-N is intended as a general purpose speech resource that is also suitable for investigating phonetic detail.
%U http://www.lrec-conf.org/proceedings/lrec2010/pdf/314_Paper.pdf
Markdown (Informal)
[Spontal-N: A Corpus of Interactional Spoken Norwegian](http://www.lrec-conf.org/proceedings/lrec2010/pdf/314_Paper.pdf) (Sikveland et al., LREC 2010)
ACL
- Rein Ove Sikveland, Anton Öttl, Ingunn Amdal, Mirjam Ernestus, Torbjørn Svendsen, and Jens Edlund. 2010. Spontal-N: A Corpus of Interactional Spoken Norwegian. In Proceedings of the Seventh International Conference on Language Resources and Evaluation (LREC'10), Valletta, Malta. European Language Resources Association (ELRA).