Romain Laroche, Paul Trichelair, Remi Tachet des Combes
Safe Policy Improvement with Baseline Bootstrapping
ICML, 2019.
% The compound surname "Tachet des Combes" is brace-protected: unbraced, BibTeX
% treats the lowercase "des" as a von particle and takes only "Combes" as the surname.
% The title is not wrapped in an extra brace pair, so the bibliography style controls its casing.
% "url" carries the link for standard styles; "ee" is kept with the same value in case
% other tooling reads that field.
@inproceedings{ICML-2019-LarocheTC,
  author    = {Laroche, Romain and Trichelair, Paul and {Tachet des Combes}, Remi},
  title     = {Safe Policy Improvement with Baseline Bootstrapping},
  booktitle = {Proceedings of the 36th International Conference on Machine Learning},
  pages     = {3652--3661},
  publisher = {PMLR},
  year      = {2019},
  url       = {http://proceedings.mlr.press/v97/laroche19a.html},
  ee        = {http://proceedings.mlr.press/v97/laroche19a.html},
}