% Zhang and Ji, "Regret Minimization for Reinforcement Learning by Evaluating
% the Optimal Bias Function", Advances in Neural Information Processing
% Systems 32 (2019).
% The proceedings record supplies no page range, so no `pages` field is given
% (an empty `pages = {}` only produces empty-field warnings).
% The editor surname d'Alch{\'e}-Buc is braced as a unit so BibTeX neither
% treats the lowercase "d'" as a von-particle nor splits at the hyphen.
@inproceedings{NEURIPS2019_9e984c10,
  author    = {Zhang, Zihan and Ji, Xiangyang},
  title     = {Regret Minimization for Reinforcement Learning by Evaluating the Optimal Bias Function},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Wallach, H. and Larochelle, H. and Beygelzimer, A. and {d'Alch{\'e}-Buc}, F. and Fox, E. and Garnett, R.},
  volume    = {32},
  publisher = {Curran Associates, Inc.},
  year      = {2019},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2019/file/9e984c108157cea74c894b5cf34efc44-Paper.pdf},
}