@comment{Conference paper in the IJCAI-20 proceedings. The title acronym is
  brace-protected against style recasing, and month uses the standard
  three-letter macro so each style can render it.}
@inproceedings{ijcai2020p391,
  author    = {Sohn, Sungryull and Chow, Yinlam and Ooi, Jayden and Nachum, Ofir and Lee, Honglak and Chi, Ed and Boutilier, Craig},
  title     = {{BRPO}: Batch Residual Policy Optimization},
  booktitle = {Proceedings of the Twenty-Ninth International Joint Conference on Artificial Intelligence, {IJCAI-20}},
  editor    = {Bessiere, Christian},
  publisher = {International Joint Conferences on Artificial Intelligence Organization},
  pages     = {2824--2830},
  year      = {2020},
  month     = jul,
  note      = {Main track},
  doi       = {10.24963/ijcai.2020/391},
  url       = {https://doi.org/10.24963/ijcai.2020/391},
}