Ximing Liu, Tianqing Zhu, Cuiqing Jiang, Dayong Ye, Fuqing Zhao. Prioritized Experience Replay based on Multi-armed Bandit. Expert Syst. Appl., 189:116023, 2022. doi:10.1016/j.eswa.2021.116023
% Journal article record for the paper titled in the entry below.
% The pages field carries the article identifier (it matches the DOI suffix), not a page range.
% The researchr, cites and citedby fields are not standard BibTeX fields; standard styles ignore them.
@article{LiuZJYZ22,
  author    = {Liu, Ximing and Zhu, Tianqing and Jiang, Cuiqing and Ye, Dayong and Zhao, Fuqing},
  title     = {Prioritized Experience Replay based on Multi-armed Bandit},
  journal   = {Expert Systems with Applications},
  volume    = {189},
  pages     = {116023},
  year      = {2022},
  doi       = {10.1016/j.eswa.2021.116023},
  url       = {https://doi.org/10.1016/j.eswa.2021.116023},
  researchr = {https://researchr.org/publication/LiuZJYZ22},
  cites     = {0},
  citedby   = {0},
}