Benjamin Van Roy. Learning and value function approximation in complex decision processes. PhD thesis, Massachusetts Institute of Technology, Cambridge, MA, USA, 1998. Available at http://hdl.handle.net/1721.1/9960
% PhD thesis record. The note field carries the ndltd.org / OAI identifier.
% The author is written in "Last, First" form so that BibTeX keeps the
% capitalised two-word surname "Van Roy" together instead of reading "Van"
% as a given name. The institution (school) and its city (address) are kept
% in separate fields. researchr, cites and citedby are non-standard fields
% that standard bibliography styles ignore.
@phdthesis{ndltd-1930,
  author    = {Van Roy, Benjamin},
  title     = {Learning and value function approximation in complex decision processes},
  school    = {Massachusetts Institute of Technology},
  address   = {Cambridge, MA, USA},
  year      = {1998},
  url       = {http://hdl.handle.net/1721.1/9960},
  note      = {ndltd.org (oai:dspace.mit.edu:1721.1/9960)},
  researchr = {https://researchr.org/publication/ndltd-1930},
  cites     = {0},
  citedby   = {0},
}