% Conference paper from the 2023 China Automation Congress (CAC 2023) proceedings.
% The exporter's original note text is preserved verbatim in the ignored
% internal-note field so it no longer prints in the bibliography.
@inproceedings{6f454f2087584da3aec8834d9f013d5f,
  author        = {Xiao, Dengmin and Wang, Bo and Sun, Zhongqi and He, Xiao},
  title         = {Imitation Learning Method of Multi-quality Expert Data Based on {GAIL}},
  booktitle     = {Proceedings - 2023 China Automation Congress, {CAC} 2023},
  publisher     = {Institute of Electrical and Electronics Engineers Inc.},
  address       = {United States},
  pages         = {8642--8647},
  year          = {2023},
  doi           = {10.1109/CAC59555.2023.10451805},
  eventdate     = {2023-11-17/2023-11-19},
  language      = {English},
  keywords      = {GAIL, Mujoco, imitation learning, multi-quality expert data},
  abstract      = {This paper focuses on the imitation learning methods of multi-quality expert data based on Generative Adversarial Imitation Learning (GAIL). The agent is able to acquire high-quality behavioral policies through GAIL by imitating actions from experts and learning the experience distribution instead of the reward function. Considering that multi-quality expert imitation learning can achieve the effect of data augmentation, a novel GAIL-based method named MT-GAIL is proposed for imitation learning. We first define the reliability coefficient of different expert data by calculating the accuracy of corresponding discriminator. Then the reliability coefficient is used as the weight to calculate the reward function that is defined as the sum of the products of the weights and the output of corresponding discriminator. The series of rewards, states and actions are finally fed into the experience pool to train the network of policy builder. We compare the GAIL method through experiments for the cases of single-expert and multi-quality expert trajectories, which shows that the proposed MT-GAIL method is capable of avoiding the worst expert data. The effects of different reward value calculation methods on multi-quality expert data are also conducted to illustrate the distinct advantage of our proposed discriminator output value weighting method.},
  internal-note = {Publisher Copyright: {\textcopyright} 2023 IEEE.; 2023 China Automation Congress, CAC 2023 ; Conference date: 17-11-2023 Through 19-11-2023},
}