Reinforcement Q-learning for optimal tracking control of linear discrete-time systems with unknown dynamics

Bahare Kiumarsi, Frank L. Lewis, Hamidreza Modares, Ali Karimpour, Mohammad-Bagher Naghibi Sistani. Reinforcement Q-learning for optimal tracking control of linear discrete-time systems with unknown dynamics. Automatica, 50(4):1167-1175, 2014. [doi]

@comment{Journal article record. The fields researchr, cites and citedby
  are non-standard (they appear to be researchr.org export metadata) and
  are ignored by standard bibliography styles.
  NOTE(review): the last author's surname is entered as the compound
  surname Naghibi Sistani; confirm against the published paper.}
@article{KiumarsiLMKS14,
  author    = {Kiumarsi, Bahare and Lewis, Frank L. and Modares, Hamidreza and Karimpour, Ali and Naghibi Sistani, Mohammad-Bagher},
  title     = {Reinforcement {Q-learning} for optimal tracking control of linear discrete-time systems with unknown dynamics},
  journal   = {Automatica},
  volume    = {50},
  number    = {4},
  pages     = {1167--1175},
  year      = {2014},
  doi       = {10.1016/j.automatica.2014.02.015},
  url       = {http://dx.doi.org/10.1016/j.automatica.2014.02.015},
  researchr = {https://researchr.org/publication/KiumarsiLMKS14},
  cites     = {0},
  citedby   = {0},
}