@inproceedings{halabi-wald-2016-phonetic,
title = "Phonetic Inventory for an {A}rabic Speech Corpus",
author = "Halabi, Nawar and
Wald, Mike",
booktitle = "Proceedings of the Tenth International Conference on Language Resources and Evaluation ({LREC}'16)",
month = may,
year = "2016",
address = "Portoro{\v{z}}, Slovenia",
publisher = "European Language Resources Association (ELRA)",
url = "https://aclanthology.org/L16-1116",
pages = "734--738",
abstract = "Corpus design for speech synthesis is a well-researched topic in languages such as English compared to Modern Standard Arabic, and there is a tendency to focus on methods to automatically generate the orthographic transcript to be recorded (usually greedy methods). In this work, a study of Modern Standard Arabic (MSA) phonetics and phonology is conducted in order to create criteria for a greedy method to create a speech corpus transcript for recording. The size of the dataset is reduced a number of times using these optimisation methods with different parameters to yield a much smaller dataset with identical phonetic coverage than before the reduction, and this output transcript is chosen for recording. This is part of a larger work to create a completely annotated and segmented speech corpus for MSA.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="halabi-wald-2016-phonetic">
<titleInfo>
<title>Phonetic Inventory for an Arabic Speech Corpus</title>
</titleInfo>
<name type="personal">
<namePart type="given">Nawar</namePart>
<namePart type="family">Halabi</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Mike</namePart>
<namePart type="family">Wald</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2016-may</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the Tenth International Conference on Language Resources and Evaluation (LREC’16)</title>
</titleInfo>
<originInfo>
<publisher>European Language Resources Association (ELRA)</publisher>
<place>
<placeTerm type="text">Portorož, Slovenia</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>Corpus design for speech synthesis is a well-researched topic in languages such as English compared to Modern Standard Arabic, and there is a tendency to focus on methods to automatically generate the orthographic transcript to be recorded (usually greedy methods). In this work, a study of Modern Standard Arabic (MSA) phonetics and phonology is conducted in order to create criteria for a greedy method to create a speech corpus transcript for recording. The size of the dataset is reduced a number of times using these optimisation methods with different parameters to yield a much smaller dataset with identical phonetic coverage than before the reduction, and this output transcript is chosen for recording. This is part of a larger work to create a completely annotated and segmented speech corpus for MSA.</abstract>
<identifier type="citekey">halabi-wald-2016-phonetic</identifier>
<location>
<url>https://aclanthology.org/L16-1116</url>
</location>
<part>
<date>2016-may</date>
<extent unit="page">
<start>734</start>
<end>738</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Phonetic Inventory for an Arabic Speech Corpus
%A Halabi, Nawar
%A Wald, Mike
%S Proceedings of the Tenth International Conference on Language Resources and Evaluation (LREC’16)
%D 2016
%8 may
%I European Language Resources Association (ELRA)
%C Portorož, Slovenia
%F halabi-wald-2016-phonetic
%X Corpus design for speech synthesis is a well-researched topic in languages such as English compared to Modern Standard Arabic, and there is a tendency to focus on methods to automatically generate the orthographic transcript to be recorded (usually greedy methods). In this work, a study of Modern Standard Arabic (MSA) phonetics and phonology is conducted in order to create criteria for a greedy method to create a speech corpus transcript for recording. The size of the dataset is reduced a number of times using these optimisation methods with different parameters to yield a much smaller dataset with identical phonetic coverage than before the reduction, and this output transcript is chosen for recording. This is part of a larger work to create a completely annotated and segmented speech corpus for MSA.
%U https://aclanthology.org/L16-1116
%P 734-738
Markdown (Informal)
[Phonetic Inventory for an Arabic Speech Corpus](https://aclanthology.org/L16-1116) (Halabi & Wald, LREC 2016)
ACL
- Nawar Halabi and Mike Wald. 2016. Phonetic Inventory for an Arabic Speech Corpus. In Proceedings of the Tenth International Conference on Language Resources and Evaluation (LREC'16), pages 734–738, Portorož, Slovenia. European Language Resources Association (ELRA).