% Conference paper in Advances in Neural Information Processing Systems, volume 33 (2020).
% The citation key is left exactly as it was so existing citations keep resolving.
% Editor names are stored as "Last, Initials" with a space between initials, so
% name-abbreviating styles keep every initial (a glued "M.F." parses as one token).
@inproceedings{NEURIPS2020_1325cdae,
  author    = {Li, Xian and Cooper Stickland, Asa and Tang, Yuqing and Kong, Xiang},
  title     = {Deep Transformers with Latent Depth},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Larochelle, H. and Ranzato, M. and Hadsell, R. and Balcan, M. F. and Lin, H.},
  volume    = {33},
  pages     = {1736--1746},
  publisher = {Curran Associates, Inc.},
  year      = {2020},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2020/file/1325cdae3b6f0f91a1b629307bf2d498-Paper.pdf},
}