@inproceedings{1f3061f8b7be46d6b312cb0de8fdb24f,
title = "End-to-end Oriental Language Speech Recognition with Integrated Language Identification",
abstract = "In recent years, with the rise of human-computer interaction and the successful application of end-to-end models in the field of speech recognition, the construction of end-to-end speech recognition models has received extensive attention. Relying on the multi-task learning method and the connection between language identification and speech recognition, we proposed an end-to-end Transformer model, which is a multilingual speech recognition model integrating language identification. The model takes the speech recognition task as the main task and the language identification task as the auxiliary task. In this paper, the validity of the model is verified by using the datasets of 13 languages in the 2021 Oriental Language Recognition challenge (OLR). The experimental results show that the model constructed in this paper has a relative improvement of 37.46% in the speech recognition task compared with the baseline system proposed by the OLR organizer. The accuracy of language identification reaches 89.70 %. The results can get the fifth place in the 2021 OLR constraint track of speech recognition equally.",
keywords = "End-to-end, Language Identification, Multi-task learning, Oriental Languages, Speech Recognition",
author = "Anbin Qi and Xiang Xie and Qingran Zhan and Chenguang Hu and Xinmei Su",
note = "Publisher Copyright: {\textcopyright} 2022 IEEE.; 2022 International Conference on Machine Learning, Control, and Robotics, MLCR 2022 ; Conference date: 29-10-2022 Through 31-10-2022",
year = "2022",
doi = "10.1109/MLCR57210.2022.00014",
language = "English",
series = "Proceedings - 2022 International Conference on Machine Learning, Control, and Robotics, MLCR 2022",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "27--31",
booktitle = "Proceedings - 2022 International Conference on Machine Learning, Control, and Robotics, MLCR 2022",
address = "United States",
}