% Conference paper (ICPR 2010): voice activity detection using hidden
% semi-Markov models. The citation key is the exporter-generated identifier
% and is kept as-is so existing citations continue to resolve.
% NOTE(review): address records a country rather than the publisher's city,
% which is what the field conventionally holds -- TODO confirm and refine.
@inproceedings{a0919bdb16fe45f2b88f3fa7fa548a73,
  author    = {Liu, Xianglong and Liang, Yuan and Lou, Yihua and Li, He and Shan, Baosong},
  title     = {Noise-robust voice activity detector based on hidden semi-{Markov} models},
  booktitle = {Proceedings - 2010 20th International Conference on Pattern Recognition, ICPR 2010},
  series    = {Proceedings - International Conference on Pattern Recognition},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  address   = {United States},
  year      = {2010},
  pages     = {81--84},
  doi       = {10.1109/ICPR.2010.28},
  isbn      = {9780769541099},
  language  = {English},
  abstract  = {This paper concentrates on speech duration distributions that are usually invariant to noises and proposes a noise-robust and real-time voice activity detector (VAD) using the hidden semi-Markov model (HSMM) to explicitly model state durations. Motivated by statistical observations and tests on TIMIT and the IEEE sentence database, we use Weibull distributions to model state durations approximately and estimate their parameters by maximum likelihood estimators. The final VAD decision is made according to the likelihood ratio test (LRT) incorporating state prior knowledge and modified forward variables. An efficient way that recursively calculates modified forward variables is devised and a dynamic adjustment scheme is used to update parameters. Experiments on noisy speech data show that the proposed method performs more robustly and accurately than the standard ITU-T G.729B VAD and AMR2.},
}