% Hong et al. (2024), "Text-to-Song", ACL 2024 (Volume 1: Long Papers), pp. 6248--6261.
@inproceedings{hong-etal-2024-text,
  author    = {Hong, Zhiqing and Huang, Rongjie and Cheng, Xize and Wang, Yongqi and Li, Ruiqi and You, Fuming and Zhao, Zhou and Zhang, Zhimeng},
  title     = {Text-to-Song: Towards Controllable Music Generation Incorporating Vocal and Accompaniment},
  editor    = {Ku, Lun-Wei and Martins, Andre and Srikumar, Vivek},
  booktitle = {Proceedings of the 62nd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)},
  publisher = {Association for Computational Linguistics},
  address   = {Bangkok, Thailand},
  month     = aug,
  year      = {2024},
  pages     = {6248--6261},
  doi       = {10.18653/v1/2024.acl-long.339},
  url       = {https://aclanthology.org/2024.acl-long.339/},
}