Vivek S. Borkar, Siddharth Chandak. Prospect-theoretic Q-learning. Systems & Control Letters, 156:105009, 2021. doi:10.1016/j.sysconle.2021.105009
% Journal article record. The ampersand in the journal name is escaped for LaTeX,
% and Q-learning is brace-protected so sentence-casing styles keep the capital Q.
% The pages field carries the article identifier 105009 (same as the DOI suffix).
@article{BorkarC21,
  author    = {Borkar, Vivek S. and Chandak, Siddharth},
  title     = {Prospect-theoretic {Q-learning}},
  journal   = {Systems \& Control Letters},
  volume    = {156},
  pages     = {105009},
  year      = {2021},
  doi       = {10.1016/j.sysconle.2021.105009},
  url       = {https://doi.org/10.1016/j.sysconle.2021.105009},
  researchr = {https://researchr.org/publication/BorkarC21},
  cites     = {0},
  citedby   = {0},
}