Jiajin Li, Baoxiang Wang, Shengyu Zhang. Policy Optimization with Second-Order Advantage Information. In Jérôme Lang, editor, Proceedings of the Twenty-Seventh International Joint Conference on Artificial Intelligence, IJCAI 2018, July 13-19, 2018, Stockholm, Sweden, pages 5038-5044. ijcai.org, 2018. doi:10.24963/ijcai.2018/699
% Conference paper, IJCAI 2018. Names are in "Last, First" form, accents use
% BibTeX special-character escapes, and the page range uses "--".
% researchr/cites/citedby are non-standard fields that come from the original record.
@inproceedings{LiWZ18-5,
  author    = {Li, Jiajin and Wang, Baoxiang and Zhang, Shengyu},
  title     = {Policy Optimization with Second-Order Advantage Information},
  booktitle = {Proceedings of the Twenty-Seventh International Joint Conference on Artificial Intelligence, {IJCAI} 2018, July 13-19, 2018, Stockholm, Sweden},
  editor    = {Lang, J{\'e}r{\^o}me},
  pages     = {5038--5044},
  publisher = {ijcai.org},
  year      = {2018},
  isbn      = {978-0-9992411-2-7},
  doi       = {10.24963/ijcai.2018/699},
  url       = {https://doi.org/10.24963/ijcai.2018/699},
  researchr = {https://researchr.org/publication/LiWZ18-5},
  cites     = {0},
  citedby   = {0},
}