% Conference paper from ISCSLP 2016 (conference dates 17-20 Oct 2016 per the note field); year/month/day below give 2 May 2017.
@inproceedings{0eb19467597a458181c673f90d2bc676,
  author    = {Hou, Jingyong and Xie, Lei and Fu, Zhonghua},
  title     = {Investigating neural network based query-by-example keyword spotting approach for personalized wake-up word detection in {Mandarin} {Chinese}},
  booktitle = {Proceedings of 2016 10th International Symposium on Chinese Spoken Language Processing, ISCSLP 2016},
  editor    = {Wang, Hsin-Min and Hou, Qingzhi and Wei, Yuan and Lee, Tan and Wei, Jianguo and Xie, Lei and Feng, Hui and Dang, Jianwu},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  year      = {2017},
  month     = may,
  day       = {2},
  doi       = {10.1109/ISCSLP.2016.7918366},
  language  = {English},
  keywords  = {DNN, DTW, LSTM, Query-by-Example, Spotting, Wake-up Word Detection},
  abstract  = {We use query-by-example keyword spotting (QbyE-KWS) approach to solve the personalized wake-up word detection problem for small-footprint, low-computational cost on-device applications. QbyE-KWS takes keywords as templates, and matches the templates across an audio stream via DTW to see if the keyword is included. In this paper, we use neural networks as acoustic models to extract DNN/LSTM phoneme posterior features and LSTM embedding features. Specifically, we investigate the LSTM embedding feature extractor for different modeling units in Mandarin, spanning from phonemes to words. We also study the performances of two popular DTW approaches: S-DTW and SLN-DTW. SLN-DTW manages to accurately and effectively search the keyword in a long audio stream without the segmentation procedure that is used in S-DTW approaches. Our study shows that DNN phoneme posterior plus SLN-DTW approach achieves the highest computation efficiency and the state-of-the-art performance with 78% relative miss rate reduction as compared with the S-DTW approach. Word level LSTM embedding feature shows superior performance as compared with other embedding units.},
  note      = {Publisher Copyright: {\textcopyright} 2016 IEEE.; 10th International Symposium on Chinese Spoken Language Processing, ISCSLP 2016 ; Conference date: 17-10-2016 Through 20-10-2016},
}