Tianbing Xu, Qiang Liu 0001, Liang Zhao, Jian Peng 0001
Learning to Explore via Meta-Policy Gradient
ICML, 2018.
@inproceedings{ICML-2018-XuLZP,
  author        = {Xu, Tianbing and Liu, Qiang and Zhao, Liang and Peng, Jian},
  title         = {Learning to Explore via Meta-Policy Gradient},
  booktitle     = {Proceedings of the 35th International Conference on Machine Learning},
  pages         = {5459--5468},
  publisher     = {PMLR},
  year          = {2018},
  url           = {http://proceedings.mlr.press/v80/xu18d.html},
  ee            = {http://proceedings.mlr.press/v80/xu18d.html},
  internal-note = {Removed the numeric suffix 0001 that followed the names Qiang Liu and Jian Peng in the author field, because BibTeX parsed it as the surname (presumably a DBLP homonym identifier; confirm). The url field duplicates ee so that standard styles can see the link.},
}











