Qiang He, Xinwen Hou, Yu Liu. POPO: Pessimistic Offline Policy Optimization. In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022, pages 4008-4012. IEEE, 2022. doi:10.1109/ICASSP43922.2022.9747886
% Conference paper record. Acronyms are brace-protected so sentence-casing
% styles keep their capitals; page and date ranges use "--" (en-dash).
% researchr, cites and citedby are non-standard fields carried over from the
% original record; standard bibliography styles ignore them.
@inproceedings{HeHL22-0,
  author    = {He, Qiang and Hou, Xinwen and Liu, Yu},
  title     = {{POPO}: Pessimistic Offline Policy Optimization},
  booktitle = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2022, Virtual and Singapore, 23--27 May 2022},
  pages     = {4008--4012},
  publisher = {IEEE},
  year      = {2022},
  isbn      = {978-1-6654-0540-9},
  doi       = {10.1109/ICASSP43922.2022.9747886},
  url       = {https://doi.org/10.1109/ICASSP43922.2022.9747886},
  researchr = {https://researchr.org/publication/HeHL22-0},
  cites     = {0},
  citedby   = {0},
}