% Conference paper in the ICME 2009 proceedings (pages 574--577).
% Cleanup applied to the exported record:
%   - language is given as the ASCII name "English" (the export had the
%     Chinese word for English, which is unsafe under 8-bit BibTeX);
%   - the series field was dropped because it merely repeated booktitle;
%   - every author uses the unambiguous "Last, First" form;
%   - acronyms in booktitle are brace-protected against style recasing.
% The bracketed "[3]" in the abstract is a citation number carried over
% from the paper itself; it does not refer to anything in this database.
@inproceedings{8f007a96d7cf497297c72c4ecfc0de94,
title = "Noise robust features for speech/music discrimination in real-time telecommunication",
abstract = "While many efforts have been made in the audio signal classification field, the noise interruption problem is seldom concerned so far, especially in many telecommunication applications, where a real-time and noise robust approach is needed. This paper addresses this problem by proposing two novel robust features: Average Pitch Density (APD) and Relative Tonal Power Density (RTPD). APD refers to the differences in tone characteristics of music and speech signals, and RTPD especially focuses on the distinct properties of the percussion instruments. The comparison experiments are implemented on two databases. The first one is reorganized from the corpus collected by Scheirer et al [3]. The second one consists of data collected from various recording situations. The novel features are compared with several state-of-the-art features and are found to achieve significant robustness.",
keywords = "Audio classification, Musical system, Real cepstrum, Support vector machine",
author = "Fu, {Zhong Hua} and Wang, {Jhing Fa} and Xie, Lei",
year = "2009",
doi = "10.1109/ICME.2009.5202561",
language = "English",
isbn = "9781424442911",
pages = "574--577",
booktitle = "Proceedings - 2009 {IEEE} International Conference on Multimedia and Expo, {ICME} 2009",
note = "2009 IEEE International Conference on Multimedia and Expo, ICME 2009 ; Conference date: 28-06-2009 Through 03-07-2009",
}