Peter Vamplew, Richard Dazeley, Cameron Foale. Softmax exploration strategies for multiobjective reinforcement learning. Neurocomputing, 263:74-86, 2017. doi:10.1016/j.neucom.2016.09.141
@comment{Journal article entry. The page range uses the double-hyphen form so styles typeset an en-dash. The researchr, cites and citedby fields are non-standard and are ignored by standard styles.}
@article{VamplewDF17,
  author    = {Vamplew, Peter and Dazeley, Richard and Foale, Cameron},
  title     = {Softmax exploration strategies for multiobjective reinforcement learning},
  journal   = {Neurocomputing},
  volume    = {263},
  pages     = {74--86},
  year      = {2017},
  doi       = {10.1016/j.neucom.2016.09.141},
  url       = {https://doi.org/10.1016/j.neucom.2016.09.141},
  researchr = {https://researchr.org/publication/VamplewDF17},
  cites     = {0},
  citedby   = {0},
}