% IJCAI-21 main-track conference paper (Wang et al., 2021), pages 1113--1121.
% The citation key is the publisher-assigned identifier; keep it stable for existing citations.
% The month uses the predefined macro (unquoted) so each style can render it.
@inproceedings{ijcai2021p154,
  author    = {Wang, Wenzhe and Zhang, Mengdan and Chen, Runnan and Cai, Guanyu and Zhou, Penghao and Peng, Pai and Guo, Xiaowei and Wu, Jian and Sun, Xing},
  title     = {Dig into Multi-modal Cues for Video Retrieval with Hierarchical Alignment},
  booktitle = {Proceedings of the Thirtieth International Joint Conference on Artificial Intelligence, {IJCAI-21}},
  editor    = {Zhou, Zhi-Hua},
  publisher = {International Joint Conferences on Artificial Intelligence Organization},
  pages     = {1113--1121},
  year      = {2021},
  month     = aug,
  note      = {Main Track},
  doi       = {10.24963/ijcai.2021/154},
  url       = {https://doi.org/10.24963/ijcai.2021/154},
}