% Anthony et al., Advances in Neural Information Processing Systems 33 (2020).
% Accented letters use the brace-wrapped special-character form so that classic
% BibTeX sorts and labels them as single letters; the game name in the title is
% braced so sentence-casing styles keep its capital.
@inproceedings{NEURIPS2020_d1419302,
  author    = {Anthony, Thomas and Eccles, Tom and Tacchetti, Andrea and Kram{\'a}r, J{\'a}nos and Gemp, Ian and Hudson, Thomas and Porcel, Nicolas and Lanctot, Marc and Perolat, Julien and Everett, Richard and Singh, Satinder and Graepel, Thore and Bachrach, Yoram},
  title     = {Learning to Play No-Press {Diplomacy} with Best Response Policy Iteration},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Larochelle, H. and Ranzato, M. and Hadsell, R. and Balcan, M. F. and Lin, H.},
  volume    = {33},
  pages     = {17987--18003},
  publisher = {Curran Associates, Inc.},
  year      = {2020},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2020/file/d1419302db9c022ab1d48681b13d5f8b-Paper.pdf},
}