% Entry for the EzAudio paper in Interspeech 2025 (pages 4233--4237).
% Only the proper name in the title is brace-protected, so the bibliography
% style remains free to apply its own casing to the rest of the title.
% The url is stored raw (no LaTeX escapes); url-aware styles typeset it verbatim.
@inproceedings{hai2025_interspeech,
  author    = {Hai, Jiarui and Xu, Yong and Zhang, Hao and Li, Chenxing and Wang, Helin and Elhilali, Mounya and Yu, Dong},
  booktitle = {Interspeech 2025},
  doi       = {10.21437/Interspeech.2025-1137},
  pages     = {4233--4237},
  title     = {{EzAudio}: Enhancing Text-to-Audio Generation with Efficient Diffusion Transformer},
  url       = {https://www.isca-archive.org/interspeech_2025/hai25_interspeech.pdf},
  year      = {2025}
}