Ronald Ortner, Daniil Ryabko, Peter Auer, Rémi Munos. Regret bounds for restless Markov bandits. Theoretical Computer Science, 558:62-76, 2014. doi:10.1016/j.tcs.2014.09.026
% Journal article record. The researchr, cites and citedby fields are not
% standard BibTeX fields; standard styles ignore them (kept as exported).
@article{OrtnerRAM14,
  author    = {Ortner, Ronald and Ryabko, Daniil and Auer, Peter and Munos, R{\'e}mi},
  title     = {Regret bounds for restless {Markov} bandits},
  journal   = {Theoretical Computer Science},
  volume    = {558},
  pages     = {62--76},
  year      = {2014},
  doi       = {10.1016/j.tcs.2014.09.026},
  url       = {https://doi.org/10.1016/j.tcs.2014.09.026},
  researchr = {https://researchr.org/publication/OrtnerRAM14},
  cites     = {0},
  citedby   = {0},
}