Jonathan Baxter, Peter L. Bartlett
Reinforcement Learning in POMDP’s via Direct Gradient Ascent
ICML, 2000.
% Conference paper. Only the acronym in the title is brace-protected, so the
% bibliography style controls the casing of the remaining words.
@inproceedings{ICML-2000-BaxterB,
  author    = {Baxter, Jonathan and Bartlett, Peter L.},
  title     = {Reinforcement Learning in {POMDP's} via Direct Gradient Ascent},
  booktitle = {Proceedings of the 17th International Conference on Machine Learning},
  publisher = {Morgan Kaufmann},
  pages     = {41--48},
  year      = {2000},
  isbn      = {1-55860-707-2},
}











