Chicheng Zhang, Alekh Agarwal, Hal Daumé III, John Langford, Sahand Negahban
Warm-starting Contextual Bandits: Robustly Combining Supervised and Bandit Feedback
ICML, 2019.
@comment{ICML 2019 conference paper. The ee field (electronic-edition link, as found in DBLP-style exports) is not printed by standard styles; url repeats the same link for styles that do print URLs.}
@inproceedings{ICML-2019-ZhangAD0N,
  author    = {Zhang, Chicheng and Agarwal, Alekh and Daum{\'e} III, Hal and Langford, John and Negahban, Sahand},
  title     = {Warm-starting Contextual Bandits: Robustly Combining Supervised and Bandit Feedback},
  booktitle = {Proceedings of the 36th International Conference on Machine Learning},
  pages     = {7335--7344},
  publisher = {PMLR},
  year      = {2019},
  ee        = {http://proceedings.mlr.press/v97/zhang19b.html},
  url       = {http://proceedings.mlr.press/v97/zhang19b.html},
}
Tags: