Makoto Sato, Shigenobu Kobayashi
Average-Reward Reinforcement Learning for Variance Penalized Markov Decision Problems
ICML, 2001.
@comment{Conference paper record. The title is stored in Title Case with only
the proper noun "Markov" brace-protected, so the bibliography style decides
the final capitalisation. Author names use the "Last, First" form.}
@inproceedings{ICML-2001-SatoK,
  author    = {Sato, Makoto and Kobayashi, Shigenobu},
  title     = {Average-Reward Reinforcement Learning for Variance Penalized {Markov} Decision Problems},
  booktitle = {Proceedings of the 18th International Conference on Machine Learning},
  publisher = {Morgan Kaufmann},
  pages     = {473--480},
  year      = 2001,
  isbn      = {1-55860-778-1},
}