% Agrawal and Jia, NeurIPS 2017 (volume 30).
% NOTE(review): the exported entry carried an empty pages field, which was
% dropped to avoid empty-field warnings; add the page range once it has been
% confirmed against the published proceedings.
@inproceedings{NIPS2017_3621f145,
  author    = {Agrawal, Shipra and Jia, Randy},
  title     = {Optimistic posterior sampling for reinforcement learning: worst-case regret bounds},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Guyon, I. and von Luxburg, U. and Bengio, S. and Wallach, H. and Fergus, R. and Vishwanathan, S. and Garnett, R.},
  volume    = {30},
  publisher = {Curran Associates, Inc.},
  year      = {2017},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2017/file/3621f1454cacf995530ea53652ddf8fb-Paper.pdf},
}