Shicong Cen, Chen Cheng, Yuxin Chen, Yuting Wei, Yuejie Chi. Fast Global Convergence of Natural Policy Gradient Methods with Entropy Regularization. Operations Research, 70(4):2563–2578, 2022. doi:10.1287/opre.2021.2151
@comment{
  CenCCWC22: journal article in Operations Research 70(4), 2022.
  Author names are stored in "Last, First" form. The numeric suffix that
  followed "Yuxin Chen" in the exported record is a database homonym tag,
  not part of the name, and is omitted so the surname parses as "Chen".
  The fields researchr, cites and citedby are exporter metadata; standard
  styles ignore unknown fields.
}
@article{CenCCWC22,
  author    = {Cen, Shicong and Cheng, Chen and Chen, Yuxin and Wei, Yuting and Chi, Yuejie},
  title     = {Fast Global Convergence of Natural Policy Gradient Methods with Entropy Regularization},
  journal   = {Operations Research},
  volume    = {70},
  number    = {4},
  pages     = {2563--2578},
  year      = {2022},
  doi       = {10.1287/opre.2021.2151},
  url       = {https://doi.org/10.1287/opre.2021.2151},
  researchr = {https://researchr.org/publication/CenCCWC22},
  cites     = {0},
  citedby   = {0},
}