Hyeong Soo Chang, Jiaqiao Hu, Michael C. Fu, Steven I. Marcus. Adaptive Adversarial Multi-Armed Bandit Approach to Two-Person Zero-Sum Markov Games. IEEE Trans. Automat. Contr., 55(2):463-468, 2010. doi:10.1109/TAC.2009.2036333
@comment{Journal article. Citation key ChangHFM10 is unchanged. The fields researchr, cites and citedby are non-standard and are ignored by standard bibliography styles.}
@article{ChangHFM10,
  author    = {Chang, Hyeong Soo and Hu, Jiaqiao and Fu, Michael C. and Marcus, Steven I.},
  title     = {Adaptive Adversarial Multi-Armed Bandit Approach to Two-Person Zero-Sum {Markov} Games},
  journal   = {{IEEE} Transactions on Automatic Control},
  volume    = {55},
  number    = {2},
  pages     = {463--468},
  year      = {2010},
  doi       = {10.1109/TAC.2009.2036333},
  url       = {https://doi.org/10.1109/TAC.2009.2036333},
  researchr = {https://researchr.org/publication/ChangHFM10},
  cites     = {0},
  citedby   = {0},
}