% Conference paper from the IAT 2013 proceedings. The proceedings title is
% stored only in `booktitle`; it is deliberately not repeated in `series`,
% because styles print `series` in addition to `booktitle`.
@inproceedings{791e113082c44a838dd037d1949fd84c,
  author    = {Zhu, Xiangbin and Zhang, Chongjie and Lesser, Victor},
  title     = {Combining dynamic reward shaping and action shaping for coordinating multi-agent learning},
  booktitle = {Proceedings - 2013 {IEEE/WIC/ACM} International Conference on Intelligent Agent Technology, {IAT} 2013},
  pages     = {321--328},
  publisher = {IEEE Computer Society},
  year      = {2013},
  isbn      = {9781479929023},
  doi       = {10.1109/WI-IAT.2013.127},
  language  = {English},
  keywords  = {Action shaping, Multi-agent learning, Organization control, Reward shaping, Supervision},
  abstract  = {Coordinating multi-agent reinforcement learning provides a promising approach to scaling learning in large cooperative multi-agent systems. It allows agents to learn local decision policies based on their local observations and rewards, and, meanwhile, coordinates agents' learning processes to ensure the global learning performance. One key question is that how coordination mechanisms impact learning algorithms so that agents' learning processes are guided and coordinated. This paper presents a new shaping approach that effectively integrates coordination mechanisms into local learning processes. This shaping approach uses two-level agent organization structures and combines reward shaping and action shaping. The higher-level agents dynamically and periodically produce the shaping heuristic knowledge based on the learning status of the lower-level agents. The lower-level agents then uses this knowledge to coordinate their local learning processes with other agents. Experimental results show our approach effectively speeds up the convergence of multi-agent learning in large systems.},
  note      = {2013 12th IEEE/WIC/ACM International Conference on Intelligent Agent Technology, IAT 2013 ; Conference date: 17-11-2013 Through 20-11-2013},
}