Manuel Loth, Philippe Preux, Manuel Davy. A unified view of TD algorithms, introducing Full-gradient TD and Equi-gradient descent TD. In ESANN 2007, 15th European Symposium on Artificial Neural Networks, Bruges, Belgium, April 25-27, 2007, Proceedings, pages 289-294, 2007. [doi]
% ESANN 2007 conference paper by Loth, Preux and Davy.
% The researchr, cites and citedby fields are non-standard bookkeeping fields;
% unknown fields are ignored by bibliography styles.
@inproceedings{LothPD07,
  author    = {Loth, Manuel and Preux, Philippe and Davy, Manuel},
  title     = {A unified view of {TD} algorithms, introducing {Full-gradient} {TD} and {Equi-gradient} descent {TD}},
  booktitle = {{ESANN} 2007, 15th European Symposium on Artificial Neural Networks, Bruges, Belgium, April 25--27, 2007, Proceedings},
  pages     = {289--294},
  year      = {2007},
  url       = {http://www.dice.ucl.ac.be/Proceedings/esann/esannpdf/es2007-93.pdf},
  researchr = {https://researchr.org/publication/LothPD07},
  cites     = {0},
  citedby   = {0},
}