% Conference paper. `month` uses the standard BibTeX macro so the style controls
% its rendering; braces in title/booktitle protect capitals from sentence-casing.
@inproceedings{pan:neurips21,
  author    = {Pan, Ling and Rashid, Tabish and Peng, Bei and Huang, Longbo and Whiteson, Shimon},
  title     = {Regularized Softmax Deep Multi-Agent {Q}-Learning},
  booktitle = {{NeurIPS} 2021: Proceedings of the Thirty-fifth Annual Conference on Neural Information Processing Systems},
  year      = {2021},
  month     = dec,
  url       = {https://openreview.net/pdf?id=BGS3o8SpjI3},
}