% Conference paper: "TriBERT", Advances in Neural Information Processing
% Systems, volume 34 (2021). The citation key is kept as exported so that
% existing citations continue to resolve.
%
% Notes for maintainers:
%   - {TriBERT} is brace-protected so sentence-casing styles keep its
%     mixed capitalisation instead of rendering "Tribert".
%   - Editors use the "Last, First" form with spaced initials, so name
%     parsing does not depend on word order or capitalisation.
%   - NOTE(review): "Wortman Vaughan" is entered as a two-word surname;
%     confirm against the proceedings front matter.
@inproceedings{NEURIPS2021_51200d29,
  author    = {Rahman, Tanzila and Yang, Mengyu and Sigal, Leonid},
  title     = {{TriBERT}: Human-centric Audio-visual Representation Learning},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Ranzato, M. and Beygelzimer, A. and Dauphin, Y. and Liang, P. S. and Wortman Vaughan, J.},
  volume    = {34},
  pages     = {9774--9787},
  publisher = {Curran Associates, Inc.},
  year      = {2021},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2021/file/51200d29d1fc15f5a71c1dab4bb54f7c-Paper.pdf},
}