Seyed Kamyar Seyed Ghasemipour, Dale Schuurmans, Shixiang Shane Gu. EMaQ: Expected-Max Q-Learning Operator for Simple Yet Effective Offline and Online RL. In Marina Meila and Tong Zhang, editors, Proceedings of the 38th International Conference on Machine Learning, ICML 2021, 18-24 July 2021, Virtual Event. Volume 139 of Proceedings of Machine Learning Research, pages 3682-3691, PMLR, 2021. URL: http://proceedings.mlr.press/v139/ghasemipour21a.html
@comment{
  Conference paper in the ICML 2021 proceedings (PMLR volume 139).
  The citation key matches the publication id in the researchr field.
  Notes for maintainers:
    - Names use the "Last, First" form so multi-part given names parse
      unambiguously.
    - The numeric homonym suffix that followed the second editor's name
      was removed; BibTeX would otherwise parse the number as the surname.
    - Braces in the title protect acronyms from style-driven lowercasing.
    - researchr, cites and citedby are non-standard bookkeeping fields;
      standard styles ignore them.
}
@inproceedings{GhasemipourSG21,
  author    = {Ghasemipour, Seyed Kamyar Seyed and Schuurmans, Dale and Gu, Shixiang Shane},
  title     = {{EMaQ}: Expected-Max {Q}-Learning Operator for Simple Yet Effective Offline and Online {RL}},
  editor    = {Meila, Marina and Zhang, Tong},
  booktitle = {Proceedings of the 38th International Conference on Machine Learning, ICML 2021, 18-24 July 2021, Virtual Event},
  series    = {Proceedings of Machine Learning Research},
  volume    = {139},
  pages     = {3682--3691},
  publisher = {PMLR},
  year      = {2021},
  url       = {http://proceedings.mlr.press/v139/ghasemipour21a.html},
  researchr = {https://researchr.org/publication/GhasemipourSG21},
  cites     = {0},
  citedby   = {0},
}