Richard S. Sutton, Ashique Rupam Mahmood, Doina Precup, Hado van Hasselt
A new Q(λ) with interim forward view and Monte Carlo equivalence
ICML, 2014.
% Conference paper, ICML 2014 (proceedings volume 32).
% Only case-sensitive parts of the title are brace-protected so styles may still recase the rest.
% The non-standard `ee` field is kept in case existing tooling reads it; `url` holds the same
% link for standard styles.
@inproceedings{ICML-c2-2014-SuttonMPH,
  author    = {Sutton, Richard S. and Mahmood, Ashique Rupam and Precup, Doina and van Hasselt, Hado},
  title     = {A new {Q($\lambda$)} with interim forward view and {Monte Carlo} equivalence},
  booktitle = {Proceedings of the 31st International Conference on Machine Learning, Cycle 2},
  series    = {JMLR Proceedings},
  volume    = {32},
  pages     = {568--576},
  publisher = {JMLR.org},
  year      = {2014},
  url       = {http://jmlr.org/proceedings/papers/v32/sutton14.html},
  ee        = {http://jmlr.org/proceedings/papers/v32/sutton14.html},
}
Tags: