Pessimistic value iteration for multi-task data sharing in Offline Reinforcement Learning

Chenjia Bai, Lingxiao Wang, Jianye Hao, Zhuoran Yang, Bin Zhao, Zhen Wang, Xuelong Li. Pessimistic value iteration for multi-task data sharing in Offline Reinforcement Learning. Artificial Intelligence, 326:104048, January 2024. doi:10.1016/j.artint.2023.104048

% Journal article record. The exported author list carried numeric homonym
% suffixes (Lingxiao Wang 0003, Bin Zhao 0001, Xuelong Li 0001), apparently
% database disambiguation IDs; they are dropped from the author field because
% BibTeX would otherwise parse the digits as the surname. Names use the
% unambiguous "Last, First" form, and month uses the standard macro so styles
% can abbreviate or localize it. Fields researchr/cites/citedby are
% site-specific metadata that standard styles ignore.
@article{BaiWHYZWL24,
  author    = {Bai, Chenjia and Wang, Lingxiao and Hao, Jianye and Yang, Zhuoran and Zhao, Bin and Wang, Zhen and Li, Xuelong},
  title     = {Pessimistic value iteration for multi-task data sharing in Offline Reinforcement Learning},
  journal   = {Artificial Intelligence},
  volume    = {326},
  pages     = {104048},
  year      = {2024},
  month     = jan,
  doi       = {10.1016/j.artint.2023.104048},
  url       = {https://doi.org/10.1016/j.artint.2023.104048},
  researchr = {https://researchr.org/publication/BaiWHYZWL24},
  cites     = {0},
  citedby   = {0},
}