% Cai, Yang, Lee, Wang -- "Neural Temporal-Difference Learning Converges to
% Global Optima", Advances in Neural Information Processing Systems 32 (2019).
% Notes for maintainers:
%   - The proceedings export carried an empty pages field; it is omitted here
%     rather than kept blank. Add pages only if a paginated source is available.
%   - Editor names use the "Last, First" form so the surname d'Alche-Buc is
%     parsed as one unit instead of being split into a "von" particle.
%   - Editor given names are initials because that is all the export provided.
@inproceedings{NEURIPS2019_98baeb82,
  author    = {Cai, Qi and Yang, Zhuoran and Lee, Jason D. and Wang, Zhaoran},
  title     = {Neural Temporal-Difference Learning Converges to Global Optima},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Wallach, H. and Larochelle, H. and Beygelzimer, A. and d'Alch{\'e}-Buc, F. and Fox, E. and Garnett, R.},
  volume    = {32},
  publisher = {Curran Associates, Inc.},
  year      = {2019},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2019/file/98baeb82b676b662e12a7af8ad9212f6-Paper.pdf},
}