Marcus Hutter and Shane Legg. Temporal Difference Updating without a Learning Rate. In John C. Platt, Daphne Koller, Yoram Singer, and Sam T. Roweis, editors, Advances in Neural Information Processing Systems 20, Proceedings of the Twenty-First Annual Conference on Neural Information Processing Systems, Vancouver, British Columbia, Canada, December 3-6, 2007, pages 705-712. MIT Press, 2007.
@comment{
  Conference paper entry. The fields researchr, cites and citedby are not
  standard BibTeX fields; they are kept as exported and are expected to be
  ignored by standard bibliography styles.
}
@inproceedings{HutterL07,
  author    = {Hutter, Marcus and Legg, Shane},
  title     = {Temporal Difference Updating without a Learning Rate},
  booktitle = {Advances in Neural Information Processing Systems 20, Proceedings of the Twenty-First Annual Conference on Neural Information Processing Systems, Vancouver, British Columbia, Canada, December 3-6, 2007},
  editor    = {Platt, John C. and Koller, Daphne and Singer, Yoram and Roweis, Sam T.},
  pages     = {705--712},
  publisher = {MIT Press},
  year      = {2007},
  url       = {http://books.nips.cc/papers/files/nips20/NIPS2007_0514.pdf},
  researchr = {https://researchr.org/publication/HutterL07},
  cites     = {0},
  citedby   = {0},
}