% Conference paper in the NeurIPS 2022 proceedings (volume 35).
% Author given names are stored without the parenthesised nicknames that the
% original export carried; those nicknames are kept in the ignored
% internal-note field below so that name parsing stays clean while no
% information is dropped.
@inproceedings{NEURIPS2022_5b5618e7,
  author        = {Wang, Naigang and Liu, Chi-Chun and Venkataramani, Swagath and Sen, Sanchari and Chen, Chia-Yu and El Maghraoui, Kaoutar and Srinivasan, Vijayalakshmi and Chang, Leland},
  title         = {Deep Compression of Pre-trained Transformer Models},
  booktitle     = {Advances in Neural Information Processing Systems},
  editor        = {Koyejo, S. and Mohamed, S. and Agarwal, A. and Belgrave, D. and Cho, K. and Oh, A.},
  volume        = {35},
  pages         = {14140--14154},
  publisher     = {Curran Associates, Inc.},
  year          = {2022},
  url           = {https://proceedings.neurips.cc/paper_files/paper/2022/file/5b5618e7d061748267d74478b7c5b1ab-Paper-Conference.pdf},
  internal-note = {Original export listed two authors with nicknames: Liu, Chi-Chun (Charlie) and Srinivasan, Vijayalakshmi (Viji)},
}