% DeFormer paper from the ACL 2020 proceedings (58th Annual Meeting).
% The coined name is brace-protected as a whole word so that sentence-casing
% styles keep its internal capitals without splitting the word for kerning.
@inproceedings{cao-etal-2020-deformer,
  author    = {Cao, Qingqing and Trivedi, Harsh and Balasubramanian, Aruna and Balasubramanian, Niranjan},
  title     = {{DeFormer}: Decomposing Pre-trained Transformers for Faster Question Answering},
  editor    = {Jurafsky, Dan and Chai, Joyce and Schluter, Natalie and Tetreault, Joel},
  booktitle = {Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics},
  month     = jul,
  year      = {2020},
  address   = {Online},
  publisher = {Association for Computational Linguistics},
  pages     = {4487--4497},
  doi       = {10.18653/v1/2020.acl-main.411},
  url       = {https://aclanthology.org/2020.acl-main.411/},
}