Mohammad Ghavamzadeh, Sridhar Mahadevan
Hierarchically Optimal Average Reward Reinforcement Learning
ICML, 2002.
% Conference paper in the ICML 2002 proceedings. The title is stored in Title
% Case without whole-field brace protection so the bibliography style decides
% its casing; it has no acronyms or proper nouns that need protecting.
@inproceedings{ICML-2002-GhavamzadehM,
  author    = {Ghavamzadeh, Mohammad and Mahadevan, Sridhar},
  title     = {Hierarchically Optimal Average Reward Reinforcement Learning},
  booktitle = {Proceedings of the 19th International Conference on Machine Learning},
  pages     = {195--202},
  publisher = {Morgan Kaufmann},
  year      = {2002},
  isbn      = {1-55860-873-7},
}