Kaddour Najim, Alexander S. Poznyak, E. Gomez. Adaptive policy for two finite Markov chains zero-sum stochastic game with unknown transition matrices and average payoffs. Automatica, 37(7):1007-1018, 2001. doi:10.1016/S0005-1098(01)00050-4
% Journal article: Automatica, volume 37, issue 7 (2001).
% The tags, researchr, cites and citedby fields are non-standard bookkeeping
% fields; standard bibliography styles silently ignore unknown fields.
% The third author's given name is stored as an initial only, as in the source record.
@article{NajimPG01,
  author    = {Najim, Kaddour and Poznyak, Alexander S. and Gomez, E.},
  title     = {Adaptive policy for two finite {Markov} chains zero-sum stochastic game with unknown transition matrices and average payoffs},
  journal   = {Automatica},
  volume    = {37},
  number    = {7},
  pages     = {1007--1018},
  year      = {2001},
  doi       = {10.1016/S0005-1098(01)00050-4},
  url       = {https://doi.org/10.1016/S0005-1098(01)00050-4},
  tags      = {e-science, Markov},
  researchr = {https://researchr.org/publication/NajimPG01},
  cites     = {0},
  citedby   = {0},
}