% Zimmer and Weng, IJCAI-19 conference paper (pages 4496--4502).
% The month is given as the standard three-letter macro so that each
% bibliography style can render or localize it; a braced numeral would be
% printed literally by classic BibTeX styles.
@inproceedings{ijcai2019p625,
  author    = {Zimmer, Matthieu and Weng, Paul},
  title     = {Exploiting the Sign of the Advantage Function to Learn Deterministic Policies in Continuous Domains},
  booktitle = {Proceedings of the Twenty-Eighth International Joint Conference on Artificial Intelligence, {IJCAI-19}},
  publisher = {International Joint Conferences on Artificial Intelligence Organization},
  pages     = {4496--4502},
  year      = {2019},
  month     = jul,
  doi       = {10.24963/ijcai.2019/625},
  url       = {https://doi.org/10.24963/ijcai.2019/625},
}