@inproceedings{takeda-komatani-2017-unsupervised,
title = "Unsupervised Segmentation of Phoneme Sequences based on {P}itman-{Y}or Semi-{M}arkov Model using Phoneme Length Context",
author = "Takeda, Ryu and
Komatani, Kazunori",
editor = "Kondrak, Greg and
Watanabe, Taro",
booktitle = "Proceedings of the Eighth International Joint Conference on Natural Language Processing (Volume 1: Long Papers)",
month = nov,
year = "2017",
address = "Taipei, Taiwan",
publisher = "Asian Federation of Natural Language Processing",
url = "https://preview.aclanthology.org/jlcl-multiple-ingestion/I17-1025/",
pages = "243--252",
abstract = "Unsupervised segmentation of phoneme sequences is an essential process to obtain unknown words during spoken dialogues. In this segmentation, an input phoneme sequence without delimiters is converted into segmented sub-sequences corresponding to words. The Pitman-Yor semi-Markov model (PYSMM) is promising for this problem, but its performance degrades when it is applied to phoneme-level word segmentation. This is because of insufficient cues for the segmentation, e.g., homophones are improperly treated as single entries and their different contexts are also confused. We propose a phoneme-length context model for PYSMM to give a helpful cue at the phoneme-level and to predict succeeding segments more accurately. Our experiments showed that the peak performance with our context model outperformed those without such a context model by 0.045 at most in terms of F-measures of estimated segmentation."
}
Markdown (Informal)
[Unsupervised Segmentation of Phoneme Sequences based on Pitman-Yor Semi-Markov Model using Phoneme Length Context](https://preview.aclanthology.org/jlcl-multiple-ingestion/I17-1025/) (Takeda & Komatani, IJCNLP 2017)
ACL