@inproceedings{4cf87149e02b484b9207e11cbb2f1e69,
title = "LDCCRN: Robust Deep Learning-based Speech Enhancement",
abstract = "Deep learning-based speech enhancement methods make use of their non-linearity properties to estimate the speech and noise signals, especially the non-stationary noise. DCCRN, in particular, achieves state-of-the-art performance on speech intelligibility. However, the non-linear property also causes concern about the robustness of the method. Novel and unexpected noises can be generated if the noisy input speech is beyond the operation condition of the method. In this paper, we propose a hybrid framework called LDCCRN, which integrates a traditional speech enhancement method LogMMSE-EM and DCCRN. The proposed framework leverages the strength of both approaches to improve the robustness in speech enhancement. While the DCCRN continues to remove the non-stationary noise in the speech, the novel noises generated by DCCRN, if any, are effectively suppressed by LogMMSE-EM. As shown in our experimental results, the proposed method achieves better performance over the traditional approaches measured with standard evaluation methods.",
keywords = "complex-network, deep learning denoise, Speech enhancement",
author = "Yeung, {Chun Yin} and Mung, {Steve W.Y.} and Choy, {Yat Sze} and Lun, {Daniel P.K.}",
note = "Funding Information: *The work described in this paper was fully supported by a grant from the Innovation and Technology Commission of the Hong Kong Special Administrative Region, China (Project No. UIM/381). Chun-Yin Yeung, Steve W.Y. Mung, and Daniel P.K. Lun are with the Dept. of EIE and Yat Sze Choy is with the Dept. of ME of the Hong Kong Polytechnic University, Hong Kong, China. (Corresponding author: Dr Daniel P.K. Lun, e-mail:
[email protected]). Publisher Copyright: {\textcopyright} 2022 SPIE.; 2022 International Workshop on Advanced Imaging Technology, IWAIT 2022 ; Conference date: 04-01-2022 Through 06-01-2022",
year = "2022",
month = apr,
day = "30",
doi = "10.1117/12.2626108",
language = "English",
series = "Proceedings of SPIE - The International Society for Optical Engineering",
publisher = "SPIE",
editor = "Masayuki Nakajima and Shogo Muramatsu and Jae-Gon Kim and Jing-Ming Guo and Qian Kemao",
booktitle = "International Workshop on Advanced Imaging Technology, IWAIT 2022",
address = "United States",
}