% IJCAI-21 main-track paper (pp. 1113--1121); `doi` holds the bare identifier, `url` its resolver link.
@inproceedings{ijcai2021p154,
  title     = {Dig into Multi-modal Cues for Video Retrieval with Hierarchical Alignment},
  author    = {Wang, Wenzhe and Zhang, Mengdan and Chen, Runnan and Cai, Guanyu and Zhou, Penghao and Peng, Pai and Guo, Xiaowei and Wu, Jian and Sun, Xing},
  booktitle = {Proceedings of the Thirtieth International Joint Conference on Artificial Intelligence, {IJCAI-21}},
  publisher = {International Joint Conferences on Artificial Intelligence Organization},
  editor    = {Zhou, Zhi-Hua},
  pages     = {1113--1121},
  year      = {2021},
  month     = aug,
  note      = {Main Track},
  doi       = {10.24963/ijcai.2021/154},
  url       = {https://doi.org/10.24963/ijcai.2021/154},
}