% ICASSP 2012 conference paper on acoustic TextTiling (Zheng, Leung, Xie, Ma, Li).
% The citation key looks auto-generated; it is kept unchanged so existing citations still resolve.
@inproceedings{d9bebe3b98ce43a2ab58dcb8bbe90774,
  author    = {Zheng, Lilei and Leung, {Cheung Chi} and Xie, Lei and Ma, Bin and Li, Haizhou},
  title     = {Acoustic {TextTiling} for story segmentation of spoken documents},
  booktitle = {2012 {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2012 - Proceedings},
  series    = {{ICASSP}, {IEEE} International Conference on Acoustics, Speech and Signal Processing - Proceedings},
  pages     = {5121--5124},
  year      = {2012},
  doi       = {10.1109/ICASSP.2012.6289073},
  isbn      = {9781467300469},
  language  = {English},
  keywords  = {segmental dynamic time warping, spoken document processing, story segmentation, TextTiling, topic segmentation},
  abstract  = {We propose an acoustic TextTiling method based on segmental dynamic time warping for automatic story segmentation of spoken documents. Different from most of the existing methods using LVCSR transcripts, this method detects story boundaries directly from audio streams. In analogy to the cosine-based lexical similarity between two text blocks in a transcript, we define the acoustic similarity measure between two pseudo-sentences in an audio stream. Experiments on TDT2 Mandarin corpus show that acoustic TextTiling can achieve comparable performance to lexical TextTiling based on LVCSR transcripts. Moreover, we use MFCCs and Gaussian posteriorgrams as the acoustic representations in our experiments. Our experiments show that Gaussian posteriorgrams are more robust to perform segmentation for the stories each with multiple speakers.},
  note      = {2012 IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2012 ; Conference date: 25-03-2012 Through 30-03-2012},
}