Lingxiao Wang, Qi Cai, Zhuoran Yang, Zhaoran Wang. Neural Policy Gradient Methods: Global Optimality and Rates of Convergence. In 8th International Conference on Learning Representations, ICLR 2020, Addis Ababa, Ethiopia, April 26-30, 2020. OpenReview.net, 2020. https://openreview.net/forum?id=BJgQfkSYDS
@comment{
  WangCYW20: conference paper (ICLR 2020).
  The fields researchr, cites and citedby are not standard BibTeX fields;
  standard styles ignore unknown fields, so they act only as bookkeeping
  metadata (presumably carried over from the researchr.org record; verify
  before relying on the counts).
}
@inproceedings{WangCYW20,
  author    = {Lingxiao Wang and Qi Cai and Zhuoran Yang and Zhaoran Wang},
  title     = {Neural Policy Gradient Methods: Global Optimality and Rates of Convergence},
  booktitle = {8th International Conference on Learning Representations, ICLR 2020, Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher = {OpenReview.net},
  year      = {2020},
  url       = {https://openreview.net/forum?id=BJgQfkSYDS},
  researchr = {https://researchr.org/publication/WangCYW20},
  cites     = {0},
  citedby   = {0},
}