% EzAudio, as presented at the SANE 2024 workshop. Typed as a workshop paper
% (inproceedings) so that the venue in booktitle is actually printed.
% NOTE(review): author given names are initials only; expand once verified.
@inproceedings{Hai2024,
  author    = {Hai, J and Xu, Y and Zhang, H and Li, C and Wang, H and Elhilali, M and Yu, D},
  title     = {{EzAudio}: Enhancing Text-to-Audio Generation with Efficient Diffusion Transformer},
  booktitle = {Speech and Audio in the Northeast Workshop ({SANE})},
  year      = {2024},
}