Kaushik Roy, Qi Zhang, Manas Gaur, Amit P. Sheth. Knowledge Infused Policy Gradients with Upper Confidence Bound for Relational Bandits. In Nuria Oliver, Fernando Pérez-Cruz, Stefan Kramer, Jesse Read, José Antonio Lozano, editors, Machine Learning and Knowledge Discovery in Databases. Research Track - European Conference, ECML PKDD 2021, Bilbao, Spain, September 13-17, 2021, Proceedings, Part I. Volume 12975 of Lecture Notes in Computer Science, pages 35-50, Springer, 2021. doi:10.1007/978-3-030-86486-6_3
% Conference paper in the ECML PKDD 2021 proceedings (LNCS volume 12975).
% researchr, cites and citedby are non-standard fields; standard styles ignore them.
@inproceedings{RoyZGS21-0,
  author    = {Roy, Kaushik and Zhang, Qi and Gaur, Manas and Sheth, Amit P.},
  title     = {Knowledge Infused Policy Gradients with Upper Confidence Bound for Relational Bandits},
  booktitle = {Machine Learning and Knowledge Discovery in Databases. Research Track - European Conference, {ECML} {PKDD} 2021, Bilbao, Spain, September 13-17, 2021, Proceedings, Part I},
  editor    = {Oliver, Nuria and P{\'e}rez-Cruz, Fernando and Kramer, Stefan and Read, Jesse and Lozano, Jos{\'e} Antonio},
  series    = {Lecture Notes in Computer Science},
  volume    = {12975},
  pages     = {35--50},
  publisher = {Springer},
  year      = {2021},
  isbn      = {978-3-030-86486-6},
  doi       = {10.1007/978-3-030-86486-6_3},
  url       = {https://doi.org/10.1007/978-3-030-86486-6_3},
  researchr = {https://researchr.org/publication/RoyZGS21-0},
  cites     = {0},
  citedby   = {0},
}