% Conference paper in the ISCSLP 2008 proceedings (pp. 350--353).
% Names are stored in "Last, First" form; the proceedings title lives only in
% booktitle (it is not a publication series); the acronym in booktitle is
% braced so that styles which recase titles keep it upper-case.
@inproceedings{db5d9e7a31d3436085e12f4f01cdaf21,
  author    = {Xie, Lei and Wang, Guangsen},
  title     = {A two-stage multi-feature integration approach to unsupervised speaker change detection in real-time news broadcasting},
  booktitle = {Proceedings - 2008 6th International Symposium on Chinese Spoken Language Processing, {ISCSLP} 2008},
  pages     = {350--353},
  year      = {2008},
  doi       = {10.1109/CHINSL.2008.ECP.99},
  isbn      = {9781424429431},
  language  = {English},
  keywords  = {Audio content analysis, Audio segmentation, Speaker change detection, Speaker segmentation},
  note      = {2008 6th International Symposium on Chinese Spoken Language Processing, ISCSLP 2008 ; Conference date: 16-12-2008 Through 19-12-2008},
  abstract  = {This paper presents a two-stage multi-feature integration approach for unsupervised speaker change detection in real-time news broadcasting. We integrate MFCC and LSP features (i.e. a perceptual feature plus a articulatory feature) in the metric-based potential speaker change detection stage to collect speaker boundary candidates as many as possible. We adopt a weighted Bayesian information criterion (BIC) to integrate boundary decisions from MFCC and LSP features in the speaker boundary confirmation stage. This multi-feature integration strategy makes use of the complementarity between perceptual features and articulatory features to achieve a performance gain. Speaker change detection experiments show that the multi-feature integration approach significantly outperforms the individual features with relative improvements of 26% over the LSP-only approach and 6% over the MFCC-only approach.},
}