@inproceedings{3cb1ba8d6c734e5f9510237bfde9ef19,
title = "Non-Intrusive Audio Quality Assessment Based on Deep Neural Network for Subjective MOS Prediction",
abstract = "Non-intrusive audio quality assessment, particularly for subjective MOS prediction for music signal, is crucial in realtime audio communication and playback systems. While network-based methods have been extensively used for objective speech quality assessment, evaluating audio quality presents a greater challenge due to higher sampling rates and more complex signal spectrum. In this paper, we design a non-intrusive audio quality assessment system based on deep neural network for subjective MOS prediction of distorted audio signals. Mixed perceptual features are extracted for signal analysis, and both objective and subjective indicators are utilized as labels for two-step training on simulated data. Besides, we apply improved convolution layers, attention layers, and a type of new loss to improve the performance of our model. The experimental results show that the proposed system performs better than conventional assessment methods in correlation.",
keywords = "Audio quality assessment, Deep learning, MOS prediction, Non-intrusive",
author = "Xinwen Yue and Yupei Zhang and Jianqian Zhang and Zhiyu Li and Jing Wang and Shenghui Zhao",
note = "Publisher Copyright: {\textcopyright}2024 IEEE.; 14th International Symposium on Chinese Spoken Language Processing, ISCSLP 2024 ; Conference date: 07-11-2024 Through 10-11-2024",
year = "2024",
doi = "10.1109/ISCSLP63861.2024.10800631",
language = "English",
series = "2024 14th International Symposium on Chinese Spoken Language Processing, ISCSLP 2024",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "76--80",
editor = "Yanmin Qian and Qin Jin and Zhijian Ou and Zhenhua Ling and Zhiyong Wu and Ya Li and Lei Xie and Jianhua Tao",
booktitle = "2024 14th International Symposium on Chinese Spoken Language Processing, ISCSLP 2024",
address = "United States",
}