Ling Pan, Qingpeng Cai, Longbo Huang. Exploration in policy optimization through multiple paths. Autonomous Agents and Multi-Agent Systems, 35(2):33, 2021. doi:10.1007/s10458-021-09518-6
@article{PanCH21,
  author    = {Ling Pan and Qingpeng Cai and Longbo Huang},
  title     = {Exploration in policy optimization through multiple paths},
  journal   = {Autonomous Agents and Multi-Agent Systems},
  volume    = {35},
  number    = {2},
  pages     = {33},
  year      = {2021},
  doi       = {10.1007/s10458-021-09518-6},
  url       = {https://doi.org/10.1007/s10458-021-09518-6},
  researchr = {https://researchr.org/publication/PanCH21},
  cites     = {0},
  citedby   = {0},
}