% DocumentNet paper, EMNLP 2023 Industry Track (record in ACL Anthology format).
% The coined name in the title is brace-protected as a whole word so styles
% that sentence-case titles keep its capitalisation.
@inproceedings{yu-etal-2023-documentnet,
  author    = {Yu, Lijun and Miao, Jin and Sun, Xiaoyu and Chen, Jiayi and Hauptmann, Alexander and Dai, Hanjun and Wei, Wei},
  title     = {{DocumentNet}: Bridging the Data Gap in Document Pre-training},
  editor    = {Wang, Mingxuan and Zitouni, Imed},
  booktitle = {Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing: Industry Track},
  month     = dec,
  year      = {2023},
  address   = {Singapore},
  publisher = {Association for Computational Linguistics},
  pages     = {707--722},
  doi       = {10.18653/v1/2023.emnlp-industry.66},
  url       = {https://aclanthology.org/2023.emnlp-industry.66/},
}