Obtaining accurate estimated action values in categorical distributional reinforcement learning

Yingnan Zhao, Peng Liu, Chenjia Bai, Wei Zhao, Xianglong Tang. Obtaining accurate estimated action values in categorical distributional reinforcement learning. Knowl.-Based Syst., 194:105511, 2020. doi:10.1016/j.knosys.2020.105511

% Journal article (article number 105511, no page range).
% Authors are written as "Last, First"; the numeric "0008" suffixes that followed
% two of the names in the export were removed, because BibTeX would otherwise
% parse "0008" as the surname. The journal name is spelled out in full so the
% bibliography style can decide whether to abbreviate it.
% researchr / cites / citedby are site-specific fields ignored by standard styles.
@article{ZhaoLBZT20,
  author    = {Zhao, Yingnan and Liu, Peng and Bai, Chenjia and Zhao, Wei and Tang, Xianglong},
  title     = {Obtaining accurate estimated action values in categorical distributional reinforcement learning},
  journal   = {Knowledge-Based Systems},
  volume    = {194},
  pages     = {105511},
  year      = {2020},
  doi       = {10.1016/j.knosys.2020.105511},
  url       = {https://doi.org/10.1016/j.knosys.2020.105511},
  researchr = {https://researchr.org/publication/ZhaoLBZT20},
  cites     = {0},
  citedby   = {0},
}