Ronald Ortner. Online regret bounds for Markov decision processes with deterministic transitions. Theoretical Computer Science, 411(29-30):2684-2695, 2010. doi:10.1016/j.tcs.2010.04.005
% Journal article record exported from researchr.org.
% The tags, researchr, cites and citedby fields are researchr bookkeeping;
% they are not standard BibTeX fields and standard styles ignore them.
@article{Ortner10-0,
  author    = {Ortner, Ronald},
  title     = {Online regret bounds for {Markov} decision processes with deterministic transitions},
  journal   = {Theoretical Computer Science},
  volume    = {411},
  number    = {29--30},
  pages     = {2684--2695},
  year      = {2010},
  doi       = {10.1016/j.tcs.2010.04.005},
  url       = {https://doi.org/10.1016/j.tcs.2010.04.005},
  tags      = {Markov},
  researchr = {https://researchr.org/publication/Ortner10-0},
  cites     = {0},
  citedby   = {0},
}