Ching-An Cheng, Remi Tachet des Combes, Byron Boots, Geoffrey J. Gordon. A Reduction from Reinforcement Learning to No-Regret Online Learning. In Silvia Chiappa, Roberto Calandra, editors, The 23rd International Conference on Artificial Intelligence and Statistics, AISTATS 2020, 26-28 August 2020, Online [Palermo, Sicily, Italy]. Volume 108 of Proceedings of Machine Learning Research, pages 3514-3524, PMLR, 2020. [doi]
% Conference paper in the AISTATS 2020 proceedings (PMLR volume 108).
% The compound surname "Tachet des Combes" is braced so that BibTeX does not
% split it at the lowercase particle "des". The fields researchr, cites and
% citedby are not standard BibTeX fields; standard styles ignore them.
@inproceedings{ChengCBG20,
  author    = {Cheng, Ching-An and {Tachet des Combes}, Remi and Boots, Byron and Gordon, Geoffrey J.},
  title     = {A Reduction from Reinforcement Learning to No-Regret Online Learning},
  booktitle = {The 23rd International Conference on Artificial Intelligence and Statistics, {AISTATS} 2020, 26--28 August 2020, Online [Palermo, Sicily, Italy]},
  editor    = {Chiappa, Silvia and Calandra, Roberto},
  series    = {Proceedings of Machine Learning Research},
  volume    = {108},
  pages     = {3514--3524},
  publisher = {PMLR},
  year      = {2020},
  url       = {http://proceedings.mlr.press/v108/cheng20b.html},
  researchr = {https://researchr.org/publication/ChengCBG20},
  cites     = {0},
  citedby   = {0},
}