Rommert Dekker, Arie Hordijk. Average, Sensitive and Blackwell Optimal Policies in Denumerable Markov Decision Chains with Unbounded Rewards. Math. Oper. Res., 13(3):395-420, 1988. doi:10.1287/moor.13.3.395
@comment{DekkerH88: journal article record. The fields researchr, cites and citedby are non-standard bookkeeping fields (presumably from the researchr.org export); standard bibliography styles ignore unknown fields.}
@article{DekkerH88,
  author    = {Dekker, Rommert and Hordijk, Arie},
  title     = {Average, Sensitive and {Blackwell} Optimal Policies in Denumerable {Markov} Decision Chains with Unbounded Rewards},
  journal   = {Mathematics of Operations Research},
  volume    = {13},
  number    = {3},
  pages     = {395--420},
  year      = {1988},
  doi       = {10.1287/moor.13.3.395},
  url       = {http://dx.doi.org/10.1287/moor.13.3.395},
  researchr = {https://researchr.org/publication/DekkerH88},
  cites     = {0},
  citedby   = {0},
}