Masrour Zoghi, Shimon Whiteson, Rémi Munos, Maarten de Rijke
Relative Upper Confidence Bound for the K-Armed Dueling Bandit Problem
ICML, 2014.
% Entry notes: the title is stored in Title Case with only the variable K
% brace-protected, so sentence-casing styles keep it uppercase. The accented
% author name uses a LaTeX escape so the entry also works with 8-bit BibTeX.
% The non-standard ee field is retained unchanged; url repeats the same link
% for styles that print URLs.
@inproceedings{ICML-c2-2014-ZoghiWMR,
  author    = {Zoghi, Masrour and Whiteson, Shimon and Munos, R{\'e}mi and de Rijke, Maarten},
  title     = {Relative Upper Confidence Bound for the {K}-Armed Dueling Bandit Problem},
  booktitle = {Proceedings of the 31st International Conference on Machine Learning, Cycle 2},
  series    = {{JMLR} Proceedings},
  volume    = {32},
  pages     = {10--18},
  publisher = {JMLR.org},
  year      = {2014},
  ee        = {http://jmlr.org/proceedings/papers/v32/zoghi14.html},
  url       = {http://jmlr.org/proceedings/papers/v32/zoghi14.html},
}