Dennis J. N. J. Soemers, Éric Piette, Matthew Stephenson, Cameron Browne
Learning Policies from Self-Play with Policy Gradients and MCTS Value Estimates
CoG, 2019.
% Conference paper (IEEE CoG 2019). Only acronyms are brace-protected so the bibliography style controls title casing.
@inproceedings{CoG-2019-SoemersPSB,
  author    = {Soemers, Dennis J. N. J. and Piette, {\'E}ric and Stephenson, Matthew and Browne, Cameron},
  title     = {Learning Policies from Self-Play with Policy Gradients and {MCTS} Value Estimates},
  booktitle = {Proceedings of the {IEEE} Conference on Games},
  publisher = {IEEE},
  pages     = {1--8},
  year      = {2019},
  doi       = {10.1109/CIG.2019.8848037},
  isbn      = {978-1-7281-1884-0},
}