Frédérick Garcia, Florent Serre. From Q(lambda) to Average Q-learning: Efficient Implementation of an Asymptotic Approximation. In Bernhard Nebel, editor, Proceedings of the Seventeenth International Joint Conference on Artificial Intelligence, IJCAI 2001, Seattle, Washington, USA, August 4-10, 2001, pages 959-964. Morgan Kaufmann, 2001.
% Conference paper in the IJCAI 2001 proceedings. The researchr, cites and
% citedby fields are non-standard bookkeeping fields; standard styles ignore them.
@inproceedings{GarciaS01:1,
  author    = {Garcia, Fr{\'e}d{\'e}rick and Serre, Florent},
  title     = {From {Q(lambda)} to Average {Q-learning}: Efficient Implementation of an Asymptotic Approximation},
  booktitle = {Proceedings of the Seventeenth International Joint Conference on Artificial Intelligence, IJCAI 2001, Seattle, Washington, USA, August 4-10, 2001},
  editor    = {Nebel, Bernhard},
  pages     = {959--964},
  publisher = {Morgan Kaufmann},
  year      = {2001},
  isbn      = {1-55860-777-3},
  researchr = {https://researchr.org/publication/GarciaS01%3A1},
  cites     = {0},
  citedby   = {0},
}