Theodore J. Perkins, Doina Precup. A Convergent Form of Approximate Policy Iteration. In Suzanna Becker, Sebastian Thrun, Klaus Obermayer, editors, Advances in Neural Information Processing Systems 15 [Neural Information Processing Systems, NIPS 2002, December 9-14, 2002, Vancouver, British Columbia, Canada], pages 1595-1602. MIT Press, 2002. [doi]
@comment{PerkinsP02: conference paper in the NIPS 2002 proceedings (Advances in Neural Information Processing Systems 15). The fields researchr, cites and citedby are not standard BibTeX fields; bibliography styles ignore them. They are kept unchanged as tool metadata.}
@inproceedings{PerkinsP02,
  author     = {Perkins, Theodore J. and Precup, Doina},
  title      = {A Convergent Form of Approximate Policy Iteration},
  booktitle  = {Advances in Neural Information Processing Systems 15 [Neural Information Processing Systems, NIPS 2002, December 9-14, 2002, Vancouver, British Columbia, Canada]},
  editor     = {Becker, Suzanna and Thrun, Sebastian and Obermayer, Klaus},
  pages      = {1595--1602},
  publisher  = {MIT Press},
  year       = {2002},
  isbn       = {0-262-02550-7},
  url        = {http://books.nips.cc/papers/files/nips15/CN11.pdf},
  researchr  = {https://researchr.org/publication/PerkinsP02},
  cites      = {0},
  citedby    = {0},
}