% Conference paper (inproceedings) by Sunwoo Kim and Minje Kim, WASPAA 2021.
% - month is taken from the conference dates recorded in the note field
%   (17-10-2021 through 20-10-2021).
% - NOTE(review): address holds a country rather than the publisher's city;
%   confirm the intended publisher location before relying on it.
@inproceedings{aa955cb69c214837a49449bca5647b7c,
  author    = {Kim, Sunwoo and Kim, Minje},
  title     = {Test-Time Adaptation Toward Personalized Speech Enhancement: Zero-Shot Learning with Knowledge Distillation},
  booktitle = {2021 {IEEE} Workshop on Applications of Signal Processing to Audio and Acoustics, {WASPAA} 2021},
  series    = {{IEEE} Workshop on Applications of Signal Processing to Audio and Acoustics},
  pages     = {176--180},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  address   = {United States},
  year      = {2021},
  month     = oct,
  doi       = {10.1109/WASPAA52581.2021.9632771},
  language  = {English (US)},
  keywords  = {knowledge distillation, model compression, personalization, speech enhancement, zero-shot learning},
  abstract  = {In realistic speech enhancement settings for end-user devices, we often encounter only a few speakers and noise types that tend to reoccur in the specific acoustic environment. We propose a novel personalized speech enhancement method to adapt a compact denoising model to the test-time specificity. Our goal in this test-time adaptation is to utilize no clean speech target of the test speaker, thus fulfilling the requirement for zero-shot learning. To complement the lack of clean speech, we employ the knowledge distillation framework: we distill the more advanced denoising results from an overly large teacher model, and use them as the pseudo target to train the small student model. This zero-shot learning procedure circumvents the process of collecting users' clean speech, a process that users are reluctant to comply due to privacy concerns and technical difficulty of recording clean voice. Experiments on various test-time conditions show that the proposed personalization method can significantly improve the compact models' performance during the test time. Furthermore, since the personalized models outperform larger non-personalized baseline models, we claim that personalization achieves model compression with no loss of denoising performance. As expected, the student models underperform the state-of-the-art teacher models.},
  note      = {Publisher Copyright: {\textcopyright} 2021 IEEE.; 2021 IEEE Workshop on Applications of Signal Processing to Audio and Acoustics, WASPAA 2021 ; Conference date: 17-10-2021 Through 20-10-2021},
}