Chris Reinke, Eiji Uchibe, Kenji Doya. Average Reward Optimization with Multiple Discounting Reinforcement Learners. In Derong Liu, Shengli Xie, Yuanqing Li, Dongbin Zhao, El-Sayed M. El-Alfy, editors, Neural Information Processing - 24th International Conference, ICONIP 2017, Guangzhou, China, November 14-18, 2017, Proceedings, Part I. Volume 10634 of Lecture Notes in Computer Science, pages 789-800, Springer, 2017. doi:10.1007/978-3-319-70087-8_81
% Conference paper in the ICONIP 2017 proceedings (LNCS volume 10634).
% The researchr/cites/citedby fields are not standard BibTeX fields; they are
% kept as exported and are ignored by standard bibliography styles.
@inproceedings{ReinkeUD17,
  author    = {Reinke, Chris and Uchibe, Eiji and Doya, Kenji},
  title     = {Average Reward Optimization with Multiple Discounting Reinforcement Learners},
  booktitle = {Neural Information Processing - 24th International Conference, {ICONIP} 2017, Guangzhou, China, November 14-18, 2017, Proceedings, Part I},
  editor    = {Liu, Derong and Xie, Shengli and Li, Yuanqing and Zhao, Dongbin and El-Alfy, El-Sayed M.},
  series    = {Lecture Notes in Computer Science},
  volume    = {10634},
  pages     = {789--800},
  publisher = {Springer},
  year      = {2017},
  isbn      = {978-3-319-70087-8},
  doi       = {10.1007/978-3-319-70087-8_81},
  url       = {https://doi.org/10.1007/978-3-319-70087-8_81},
  researchr = {https://researchr.org/publication/ReinkeUD17},
  cites     = {0},
  citedby   = {0},
}