% CoT-VTM paper, Findings of ACL 2025.
% Braces around acronyms keep their capitalization under sentence-casing styles.
@inproceedings{guan2025cot,
  author    = {Guan, Xikang and Gu, Zheng and Huo, Jing and Ding, Tianyu and Gao, Yang},
  title     = {{CoT-VTM}: Visual-to-Music Generation with Chain-of-Thought Reasoning},
  booktitle = {Findings of the Association for Computational Linguistics: {ACL} 2025},
  pages     = {12493--12510},
  year      = {2025},
}