Tianbing Xu, Qiang Liu, Liang Zhao, Jian Peng
Learning to Explore via Meta-Policy Gradient
ICML, 2018.
% ICML 2018 conference paper, published in PMLR volume 80.
% Author names are stored in "Last, First" form without bibliography-database
% homonym suffixes, so BibTeX parses the real surnames.
@inproceedings{ICML-2018-XuLZP,
  author    = {Xu, Tianbing and Liu, Qiang and Zhao, Liang and Peng, Jian},
  title     = {Learning to Explore via Meta-Policy Gradient},
  booktitle = {Proceedings of the 35th International Conference on Machine Learning},
  series    = {Proceedings of Machine Learning Research},
  volume    = {80},
  pages     = {5459--5468},
  publisher = {PMLR},
  year      = {2018},
  url       = {http://proceedings.mlr.press/v80/xu18d.html},
}