@inproceedings{fff4854342cf47f2ae71c3dfe5eba994,
title = "A Differential Quantization Based END-TO-END Neural Speech Codec",
abstract = "Speech codecs efficiently compress speech signals, reducing the bandwidth occupied during communication. With the development of neural networks and deep learning, end-to-end speech codecs based on neural network structures have emerged. Compared to traditional codecs, these neural speech codecs can reconstruct higher-quality speech at lower bitrates. However, the performance of neural speech codecs drastically deteriorates when the communication bitrate drops to 1 kbps or below, as these codecs are based on residual quantization, which has limited performance at low bitrates. In this paper, a differential quantization based neural speech codec is proposed. In particular, the quantization focuses on the importance of difference frames and preserves key information with as few bits as possible. Meanwhile, we propose a compensator to further improve the reconstructed speech quality. Both subjective and objective evaluations demonstrate that our proposed method can achieve a higher quality of reconstructed speech at 0.6 kbps than SoundStream at 3 kbps. The entire model is causal, supporting streaming and real-time inference.",
keywords = "low bitrate, neural speech codec, vector quantization",
author = "Pincheng Lu and Liang Xu and Jing Wang",
note = "Publisher Copyright: {\textcopyright}2024 IEEE.; 14th International Symposium on Chinese Spoken Language Processing, ISCSLP 2024 ; Conference date: 07-11-2024 Through 10-11-2024",
year = "2024",
doi = "10.1109/ISCSLP63861.2024.10800135",
language = "English",
series = "2024 14th International Symposium on Chinese Spoken Language Processing, ISCSLP 2024",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "71--75",
editor = "Yanmin Qian and Qin Jin and Zhijian Ou and Zhenhua Ling and Zhiyong Wu and Ya Li and Lei Xie and Jianhua Tao",
booktitle = "2024 14th International Symposium on Chinese Spoken Language Processing, ISCSLP 2024",
address = "United States",
}