% Interspeech 2006 conference paper (cleaned portal export).
% Review notes:
%   - authors are in "Last, First" form; the export had the second author as
%     Last=Johnson, First="Mark Hasegawa", which looks like a mis-split of the
%     hyphenated surname Hasegawa-Johnson (verify against the paper).
%   - HMM is brace-protected so sentence-casing styles keep it upper-case.
%   - the export's "series" field (a verbatim copy of booktitle) was dropped,
%     and "note" now carries only the conference dates.
@inproceedings{ed10223694814a4e9e410990976eea85,
  author    = {Chitturi, Rahul and Hasegawa-Johnson, Mark},
  title     = {Novel entropy based moving average refiners for {HMM} landmarks},
  booktitle = {INTERSPEECH 2006 and 9th International Conference on Spoken Language Processing, INTERSPEECH 2006 - ICSLP},
  publisher = {International Speech Communication Association},
  year      = {2006},
  pages     = {1682--1685},
  isbn      = {9781604234497},
  language  = {English (US)},
  keywords  = {Entropy, Landmark, Moving average, Segmentation},
  abstract  = {The training of precise speech recognition models depends on accurate segmentation of the phonemes in a training corpus. Segmentation is typically performed using HMMs, but recent speech recognition work suggests that the transient acoustic features characteristic of manner-class phoneme boundaries (landmarks) may be more precisely localized using acoustic classifiers specifically designed for the task of landmark detection. This paper makes an empirical exploration of entropy based moving average techniques that are capable of improving the time alignment of phoneme boundaries proposed by an HMM-based speech recognizer. On a standard benchmark data set (A database of Hindi - National Language of India), we achieve new state-of-the-art performance, reducing RMS phone boundary alignment error from 28ms to 15ms.},
  note      = {Conference date: 17-09-2006 Through 21-09-2006},
}