Gerald Tesauro. Temporal Difference Learning and TD-Gammon. Communications of the ACM, 38(3):58-68, 1995.
% Journal article entry (key: Tesauro95).
% The researchr, cites and citedby fields are non-standard export metadata;
% standard bibliography styles ignore unknown fields, so they are kept as-is.
@article{Tesauro95,
  author    = {Tesauro, Gerald},
  title     = {Temporal Difference Learning and {TD-Gammon}},
  journal   = {Communications of the {ACM}},
  volume    = {38},
  number    = {3},
  pages     = {58--68},
  year      = {1995},
  researchr = {https://researchr.org/publication/Tesauro95},
  cites     = {0},
  citedby   = {0},
}