% Conference paper from the ICSLP 2000 proceedings; the conference dates are kept in the note field.
% Author names are stored in plain "Last, First" form so the bibliography style controls abbreviation.
@inproceedings{075a779f72904d039a19e7284f40c2d4,
  author    = {Yu, Ha Jin and Kim, Hoon and Hong, Joon Mo and Kim, Min Seong and Lee, Jong Seok},
  title     = {Large vocabulary {Korean} continuous speech recognition using a one-pass algorithm},
  booktitle = {6th International Conference on Spoken Language Processing, ICSLP 2000},
  publisher = {International Speech Communication Association},
  year      = {2000},
  language  = {English},
  note      = {Conference date: 16-10-2000 Through 20-10-2000},
  abstract  = {In this paper, we describe problems in recognizing large vocabulary Korean continuous speech, and proposed solutions to them. Korean sentences consist of eojeols, which are separated by spaces in text and consist of morphemes. When we use morpheme units, there are many word insertion and deletion errors because morpheme units are too short. We introduce a between-word phone variation lexicon that can represent many alternatives of phones of words in one structure. The decoding algorithm is composed of one pass, which is a modification of token-passing algorithm. In this algorithm, we allowed multiple tokens in a state at a time to get global best path without expanding the states when we use trigram language models. We confirmed that between-word phone variation lexicon is useful for morpheme-based recognition by observing that the improvement is higher for morpheme units than for eojeol units. Allowing multiple tokens at a state also improved the performance.},
}