Douglas Aberdeen, Jonathan Baxter. Scalable Internal-State Policy-Gradient Methods for POMDPs. In Claude Sammut, Achim G. Hoffmann, editors, Machine Learning, Proceedings of the Nineteenth International Conference (ICML 2002), University of New South Wales, Sydney, Australia, July 8-12, 2002, pages 3-10. Morgan Kaufmann, 2002.
% Conference paper (ICML 2002). The researchr/cites/citedby fields are non-standard export metadata; unknown fields are ignored by bibliography styles.
@inproceedings{AberdeenB02,
  author    = {Aberdeen, Douglas and Baxter, Jonathan},
  title     = {Scalable Internal-State Policy-Gradient Methods for {POMDPs}},
  booktitle = {Machine Learning, Proceedings of the Nineteenth International Conference ({ICML} 2002), University of New South Wales, Sydney, Australia, July 8-12, 2002},
  editor    = {Sammut, Claude and Hoffmann, Achim G.},
  pages     = {3--10},
  publisher = {Morgan Kaufmann},
  year      = {2002},
  isbn      = {1-55860-873-7},
  researchr = {https://researchr.org/publication/AberdeenB02},
  cites     = {0},
  citedby   = {0},
}