Koki Saito, Akira Notsu, Seiki Ubukata, Katsuhiro Honda. Performance Investigation of UCB Policy in Q-learning. In 14th IEEE International Conference on Machine Learning and Applications, ICMLA 2015, Miami, FL, USA, December 9-11, 2015. pages 777-780, IEEE, 2015. [doi]
% Conference paper (ICMLA 2015). Acronyms are brace-protected against style
% recasing; researchr, cites and citedby are non-standard bookkeeping fields
% from the exporting site and are ignored by standard bibliography styles.
@inproceedings{SaitoNUH15,
  author    = {Saito, Koki and Notsu, Akira and Ubukata, Seiki and Honda, Katsuhiro},
  title     = {Performance Investigation of {UCB} Policy in {Q}-learning},
  booktitle = {14th {IEEE} International Conference on Machine Learning and Applications, {ICMLA} 2015, Miami, {FL}, {USA}, December 9-11, 2015},
  pages     = {777--780},
  publisher = {IEEE},
  year      = {2015},
  isbn      = {978-1-5090-0287-0},
  doi       = {10.1109/ICMLA.2015.59},
  url       = {https://doi.org/10.1109/ICMLA.2015.59},
  researchr = {https://researchr.org/publication/SaitoNUH15},
  cites     = {0},
  citedby   = {0},
}