Tuning continual exploration in reinforcement learning: An optimality property of the Boltzmann strategy

Youssef Achbany, François Fouss, Luh Yen, Alain Pirotte, Marco Saerens. Tuning continual exploration in reinforcement learning: An optimality property of the Boltzmann strategy. Neurocomputing, 71(13–15):2507–2520, 2008. doi:10.1016/j.neucom.2007.11.040

% Journal article (Neurocomputing, vol. 71, issues 13--15, 2008).
% Names are in "Last, First" form and the accented letter is written as a
% BibTeX special character so sorting and labels work under classic BibTeX.
% The researchr/cites/citedby fields are non-standard export metadata; unknown
% fields are ignored by bibliography styles.
@article{AchbanyFYPS08,
  author    = {Achbany, Youssef and Fouss, Fran{\c{c}}ois and Yen, Luh and Pirotte, Alain and Saerens, Marco},
  title     = {Tuning continual exploration in reinforcement learning: An optimality property of the {Boltzmann} strategy},
  journal   = {Neurocomputing},
  volume    = {71},
  number    = {13--15},
  pages     = {2507--2520},
  year      = {2008},
  doi       = {10.1016/j.neucom.2007.11.040},
  url       = {http://dx.doi.org/10.1016/j.neucom.2007.11.040},
  researchr = {https://researchr.org/publication/AchbanyFYPS08},
  cites     = {0},
  citedby   = {0},
}