% Journal article (IJCV); the preprint is on arXiv as 2406.19388.
% `journal` holds only the full journal name; the acronym lives in `shortjournal`
% and the publication year in `year`, so styles decide how to present them.
@article{hajiali2026taming,
  author        = {Haji-Ali, Moayed and Menapace, Willi and Siarohin, Aliaksandr and Balakrishnan, Guha and Ordonez, Vicente},
  title         = {Taming Data and Transformers for Audio Generation},
  journal       = {International Journal of Computer Vision},
  shortjournal  = {IJCV},
  year          = {2026},
  eprint        = {2406.19388},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2406.19388},
}