@inproceedings{e9ba328120684c04ae86fa1e5882f137,
title = "Bayes-tomop: A fast detection and best response algorithm towards sophisticated opponents",
abstract = "Multiagent algorithms often aim to accurately predict the behaviors of other agents and find a best response accordingly. Previous works usually assume an opponent uses a stationary strategy or randomly switches among several stationary ones. However, an opponent may exhibit more sophisticated behaviors by adopting more advanced reasoning strategies, e.g., using a Bayesian reasoning strategy. This paper proposes a novel approach called Bayes-ToMoP which can efficiently detect the strategy of opponents using either stationary or higher-level reasoning strategies. Bayes-ToMoP also supports the detection of previously unseen policies and learning a best-response policy accordingly. We also propose a deep version of Bayes-ToMoP by extending Bayes-ToMoP with DRL techniques. Experimental results show both Bayes-ToMoP and deep Bayes-ToMoP outperform the state-of-the-art approaches when faced with different types of opponents in two-agent competitive games.",
keywords = "Multiagent learning, Policy reuse, Theory of mind",
author = "Tianpei Yang and Jianye Hao and Zhaopeng Meng and Yan Zheng and Chongjie Zhang and Ze Zheng",
note = "Publisher Copyright: {\textcopyright} 2019 International Foundation for Autonomous Agents and Multiagent Systems (IFAAMAS). All rights reserved.; 18th International Conference on Autonomous Agents and Multiagent Systems, AAMAS 2019 ; Conference date: 13-05-2019 Through 17-05-2019",
year = "2019",
language = "English",
series = "Proceedings of the International Joint Conference on Autonomous Agents and Multiagent Systems, AAMAS",
publisher = "International Foundation for Autonomous Agents and Multiagent Systems (IFAAMAS)",
pages = "2282--2284",
booktitle = "18th International Conference on Autonomous Agents and Multiagent Systems, AAMAS 2019",
}