% Conference paper in the NCMMSC 2025 proceedings.
% The citation key is kept unchanged so existing citations keep resolving.
% Acronyms are brace-protected against style recasing; the DOI is stored bare (unescaped).
@inproceedings{a16ada6158544b52a8ebf91f8902df12,
  author    = {Chen, Zixuan and Pei, Hanchen and Jin, Jilu and Luo, Xueqin and Pan, Ningning and Huang, Gongping and Chen, Jingdong and Benesty, Jacob},
  title     = {On Multi-input Multi-frame {MVDR} Filter for Speech Enhancement with Heterophasic Presentation},
  booktitle = {Man-Machine Speech Communication - 20th National Conference, {NCMMSC} 2025, Proceedings},
  editor    = {Jia, Jia and Wu, Zhiyong and Gao, Lijian and Huang, Gongping and Li, Ya},
  series    = {Communications in Computer and Information Science},
  publisher = {Springer Science and Business Media Deutschland GmbH},
  year      = {2026},
  pages     = {408--421},
  doi       = {10.1007/978-981-95-5382-2_31},
  isbn      = {9789819553815},
  language  = {english},
  keywords  = {heterophasic presentation, Multi-channel binaural-output speech enhancement, MVDR filter, noise reduction},
  abstract  = {Multi-channel speech enhancement attempts to recover a target speech signal from noisy observations by exploiting spatial information captured by a microphone array. Conventional approaches typically produce a single output that contains both the desired speech and some residual noise, which neglects the benefits of human binaural hearing system. To overcome this limitation, we propose in this work a multi-input multi-frame binaural-output (MIMFBO) noise reduction method operating in the short-time-Fourier-transform (STFT) domain. This method utilizes both inter-channel and inter-frame correlations to design binaural filters that maximize the interaural coherence (IC) of the desired speech signal while minimizing the IC of the noise, all under distortionless constraints for the desired target speech. As a result, the perceived target signal and residual noise are spatially separated, substantially enhancing speech intelligibility. Simulation results demonstrate the proposed method{\textquoteright}s superiority, showing significant improvements in PESQ scores over both the single-input binaural-output MVDR and multi-input binaural-output MVDR approaches. Moreover, subjective listening tests confirm its perceptual benefits.},
  note      = {Publisher Copyright: {\textcopyright} The Author(s), under exclusive license to Springer Nature Singapore Pte Ltd. 2026. 20th National Conference on Man-Machine Speech Communication, NCMMSC 2025; Conference date: 16-10-2025 through 19-10-2025},
}