Stefan Elfwing, Eiji Uchibe, Kenji Doya. From free energy to expected energy: Improving energy-based value function approximation in reinforcement learning. Neural Networks, 84:17-27, 2016. doi:10.1016/j.neunet.2016.07.013
% Note: researchr, cites and citedby are not standard BibTeX fields; standard
% styles ignore unknown fields, so they are kept here only as export metadata.
@article{ElfwingUD16,
  author    = {Elfwing, Stefan and Uchibe, Eiji and Doya, Kenji},
  title     = {From free energy to expected energy: Improving energy-based value function approximation in reinforcement learning},
  journal   = {Neural Networks},
  volume    = {84},
  pages     = {17--27},
  year      = {2016},
  doi       = {10.1016/j.neunet.2016.07.013},
  url       = {https://doi.org/10.1016/j.neunet.2016.07.013},
  researchr = {https://researchr.org/publication/ElfwingUD16},
  cites     = {0},
  citedby   = {0},
}