% IJCAI-20 main-track paper. Names are stored in "Last, First" form and the
% month uses the predefined BibTeX macro so that any style can format them.
@inproceedings{ijcai2020p131,
  author    = {Shen, Kai and Wu, Lingfei and Xu, Fangli and Tang, Siliang and Xiao, Jun and Zhuang, Yueting},
  title     = {Hierarchical Attention Based Spatial-Temporal Graph-to-Sequence Learning for Grounded Video Description},
  booktitle = {Proceedings of the Twenty-Ninth International Joint Conference on Artificial Intelligence, {IJCAI-20}},
  editor    = {Bessiere, Christian},
  publisher = {International Joint Conferences on Artificial Intelligence Organization},
  pages     = {941--947},
  year      = {2020},
  month     = jul,
  note      = {Main track},
  doi       = {10.24963/ijcai.2020/131},
  url       = {https://doi.org/10.24963/ijcai.2020/131},
}