Jonathan Baxter, Peter L. Bartlett
Reinforcement Learning in POMDP’s via Direct Gradient Ascent
ICML, 2000.
@comment{
  Conference paper by Baxter and Bartlett, ICML 2000 proceedings, pages 41--48.
  Only the acronym in the title is brace-protected, so the bibliography style
  remains free to apply its own casing to the remaining words. The apostrophe
  is plain ASCII, which LaTeX typesets as a right single quote.
}
@inproceedings{ICML-2000-BaxterB,
  author    = {Baxter, Jonathan and Bartlett, Peter L.},
  title     = {Reinforcement Learning in {POMDP's} via Direct Gradient Ascent},
  booktitle = {Proceedings of the 17th International Conference on Machine Learning},
  pages     = {41--48},
  publisher = {Morgan Kaufmann},
  year      = {2000},
  isbn      = {1-55860-707-2},
}