@inproceedings{0463996b87684c47a36f714c7ec44e76,
title = "Q\_learning based on active backup and memory mechanism",
abstract = "Exploration is used in Q\_learning because the agent will be caught in locally optimal policies due to blind exploitation. However excessive exploration will degrade the performance of Q\_learning and it is difficult to meet the trade-off between exploration and exploitation. In this paper, the active backup is introduced into Q\_learning and the corresponding algorithm AB\_Q\_learning based on Dijkstra backup in dynamic programming is proposed. Then, the memory mechanism based MEAB\_Q\_learning algorithm is given for the agent to learn in completely unknown environment. The experimental results show that these two algorithms not only converge more quickly, but also solve the problem of local optimization.",
keywords = "Dijkstra backup, Q\_learning, Reinforcement learning",
author = "Yang Liu and Guo, \{Mao Zu\} and Yao, \{Hong Xun\}",
year = "2004",
language = "英语",
isbn = "0780384032",
series = "Proceedings of 2004 International Conference on Machine Learning and Cybernetics",
pages = "271--275",
booktitle = "Proceedings of 2004 International Conference on Machine Learning and Cybernetics",
note = "Proceedings of 2004 International Conference on Machine Learning and Cybernetics ; Conference date: 26-08-2004 Through 29-08-2004",
}