% Conference paper in the IJCAI-18 proceedings.
% `month` uses the predefined three-letter macro (unquoted) so that each
% bibliography style can render/localise it; `doi` holds the bare DOI and
% `url` is kept for styles that only print URLs.
@inproceedings{ijcai2018p699,
  author    = {Li, Jiajin and Wang, Baoxiang and Zhang, Shengyu},
  title     = {Policy Optimization with Second-Order Advantage Information},
  booktitle = {Proceedings of the Twenty-Seventh International Joint Conference on Artificial Intelligence, {IJCAI-18}},
  publisher = {International Joint Conferences on Artificial Intelligence Organization},
  pages     = {5038--5044},
  year      = {2018},
  month     = jul,
  doi       = {10.24963/ijcai.2018/699},
  url       = {https://doi.org/10.24963/ijcai.2018/699},
}