John Schulman, Sergey Levine, Pieter Abbeel, Michael I. Jordan, Philipp Moritz
Trust Region Policy Optimization
ICML, 2015.
% Conference paper in the ICML 2015 proceedings (JMLR Proceedings, volume 37).
% `ee` is the exporter's electronic-edition link; it is not a standard field and is
% ignored by bibliography styles, so the same link is also provided as `url`.
@inproceedings{ICML-2015-SchulmanLAJM,
  author    = {Schulman, John and Levine, Sergey and Abbeel, Pieter and Jordan, Michael I. and Moritz, Philipp},
  title     = {Trust Region Policy Optimization},
  booktitle = {Proceedings of the 32nd International Conference on Machine Learning},
  series    = {{JMLR} Proceedings},
  volume    = {37},
  pages     = {1889--1897},
  publisher = {JMLR.org},
  year      = {2015},
  url       = {http://jmlr.org/proceedings/papers/v37/schulman15.html},
  ee        = {http://jmlr.org/proceedings/papers/v37/schulman15.html},
}
Tags: