% IJCAI-25 (Main Track) conference paper. The month is given as the standard
% three-letter macro so each bibliography style can render it itself.
@inproceedings{ijcai2025p300,
  author    = {Xiang, Haolong and Xu, Xiaolong and Wang, Guangdong and Zhang, Xuyun and Li, Xiaoyong and Zhang, Qi and Beheshti, Amin and Fan, Wei},
  title     = {Empowering Multimodal Road Traffic Profiling with Vision Language Models and Frequency Spectrum Fusion},
  booktitle = {Proceedings of the Thirty-Fourth International Joint Conference on Artificial Intelligence, {IJCAI-25}},
  editor    = {Kwok, James},
  publisher = {International Joint Conferences on Artificial Intelligence Organization},
  pages     = {2694--2702},
  year      = {2025},
  month     = aug,
  note      = {Main Track},
  doi       = {10.24963/ijcai.2025/300},
  url       = {https://doi.org/10.24963/ijcai.2025/300},
}