Nan Jiang, Lihong Li
Doubly Robust Off-policy Value Evaluation for Reinforcement Learning
ICML, 2016.
% Conference paper (ICML 2016). Author names use the "Last, First" form; the non-standard "ee" field is retained and mirrored in "url".
@inproceedings{ICML-2016-JiangL,
  author    = {Jiang, Nan and Li, Lihong},
  title     = {Doubly Robust Off-policy Value Evaluation for Reinforcement Learning},
  booktitle = {Proceedings of the 33rd International Conference on Machine Learning},
  pages     = {652--661},
  publisher = {JMLR.org},
  year      = 2016,
  ee        = {http://proceedings.mlr.press/v48/jiang16.html},
  url       = {http://proceedings.mlr.press/v48/jiang16.html},
}











