Bahare Kiumarsi, Frank L. Lewis, Hamidreza Modares, Ali Karimpour, Mohammad-Bagher Naghibi Sistani. Reinforcement Q-learning for optimal tracking control of linear discrete-time systems with unknown dynamics. Automatica, 50(4):1167-1175, 2014. doi:10.1016/j.automatica.2014.02.015
% Journal article. Key = first author's surname + co-author surname initials + two-digit year.
% Authors use "Last, First" form so the two-word surname of the last author is parsed as one unit.
@article{KiumarsiLMKS14,
  author    = {Kiumarsi, Bahare and Lewis, Frank L. and Modares, Hamidreza and Karimpour, Ali and Naghibi Sistani, Mohammad-Bagher},
  title     = {Reinforcement {Q-learning} for optimal tracking control of linear discrete-time systems with unknown dynamics},
  journal   = {Automatica},
  volume    = {50},
  number    = {4},
  pages     = {1167--1175},
  year      = {2014},
  doi       = {10.1016/j.automatica.2014.02.015},
  url       = {http://dx.doi.org/10.1016/j.automatica.2014.02.015},
  researchr = {https://researchr.org/publication/KiumarsiLMKS14},
  cites     = {0},
  citedby   = {0},
}