Chen Tessler, Daniel J. Mankowitz, Shie Mannor. Reward Constrained Policy Optimization. In 7th International Conference on Learning Representations, ICLR 2019, New Orleans, LA, USA, May 6-9, 2019. OpenReview.net, 2019.
% Conference paper entry. Authors are given in the unambiguous "Last, First"
% form; the acronym and place names in booktitle are brace-protected so that a
% recasing style cannot lowercase them. The researchr, cites and citedby
% fields are non-standard: they are kept unchanged and are ignored by
% standard bibliography styles.
@inproceedings{TesslerMM19,
  author    = {Tessler, Chen and Mankowitz, Daniel J. and Mannor, Shie},
  title     = {Reward Constrained Policy Optimization},
  booktitle = {7th International Conference on Learning Representations, {ICLR} 2019, {New Orleans}, {LA}, {USA}, May 6--9, 2019},
  publisher = {OpenReview.net},
  year      = {2019},
  url       = {https://openreview.net/forum?id=SkfrvsA9FX},
  researchr = {https://researchr.org/publication/TesslerMM19},
  cites     = {0},
  citedby   = {0},
}