% Liu, Mahadevan, Liu -- "Regularized Off-Policy TD-Learning", NeurIPS volume 25 (2012).
% The page range was blank in the original record, so `pages` is omitted instead of
% being kept as an empty field; add it once verified against the proceedings.
@inproceedings{NIPS2012_28f0b864,
  author    = {Liu, Bo and Mahadevan, Sridhar and Liu, Ji},
  title     = {Regularized Off-Policy {TD}-Learning},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Pereira, F. and Burges, C. J. and Bottou, L. and Weinberger, K. Q.},
  volume    = {25},
  publisher = {Curran Associates, Inc.},
  year      = {2012},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2012/file/28f0b864598a1291557bed248a998d4e-Paper.pdf},
}