% IJCAI-21 main-track conference paper.
% `month` uses the standard BibTeX month macro (unquoted) so styles can
% localise/abbreviate it; names are stored in unambiguous "Last, First" form.
% `url` is the DOI resolver link, kept for styles that do not print `doi`.
@inproceedings{ijcai2021p385,
  author    = {Ma, Xiaoteng and Tang, Xiaohang and Xia, Li and Yang, Jun and Zhao, Qianchuan},
  title     = {Average-Reward Reinforcement Learning with Trust Region Methods},
  booktitle = {Proceedings of the Thirtieth International Joint Conference on Artificial Intelligence, {IJCAI-21}},
  editor    = {Zhou, Zhi-Hua},
  publisher = {International Joint Conferences on Artificial Intelligence Organization},
  pages     = {2797--2803},
  year      = {2021},
  month     = aug,
  note      = {Main Track},
  doi       = {10.24963/ijcai.2021/385},
  url       = {https://doi.org/10.24963/ijcai.2021/385},
}