% Conference paper (ICML 2020) by Zhang, Liu, Yao and Whiteson.
% The url field points to a PDF under the last author's Oxford CS pages.
% The month uses the predefined three-letter macro so each style can render it.
@inproceedings{zhang:icml20b,
  author    = {Zhang, Shangtong and Liu, Bo and Yao, Hengshuai and Whiteson, Shimon},
  title     = {Provably Convergent Two-Timescale Off-Policy Actor-Critic with Function Approximation},
  booktitle = {{ICML} 2020: Proceedings of the Thirty-Seventh International Conference on Machine Learning},
  year      = {2020},
  month     = jul,
  url       = {http://www.cs.ox.ac.uk/people/shimon.whiteson/pubs/zhangicml20b.pdf},
}