Theodore J. Perkins, Mark D. Pendrith
On the Existence of Fixed Points for Q-Learning and Sarsa in Partially Observable Domains
ICML, 2002.
@inproceedings{ICML-2002-PerkinsP,
  author    = {Perkins, Theodore J. and Pendrith, Mark D.},
  title     = {On the Existence of Fixed Points for {Q}-Learning and {Sarsa} in Partially Observable Domains},
  booktitle = {Proceedings of the 19th International Conference on Machine Learning},
  publisher = {Morgan Kaufmann},
  pages     = {490--497},
  year      = {2002},
  isbn      = {1-55860-873-7},
}