Peter Vamplew, Rustam Issabekov, Richard Dazeley, Cameron Foale, Adam Berry, Tim Moore, Douglas C. Creighton. Steering approaches to Pareto-optimal multiobjective reinforcement learning. Neurocomputing, 263:26-38, 2017. doi:10.1016/j.neucom.2016.08.152
% Journal article (Neurocomputing, vol. 263, 2017).
% The researchr, cites and citedby fields are non-standard; standard styles
% ignore unknown fields, so they are kept verbatim as annotations.
@article{VamplewIDFBMC17,
  author    = {Vamplew, Peter and Issabekov, Rustam and Dazeley, Richard and Foale, Cameron and Berry, Adam and Moore, Tim and Creighton, Douglas C.},
  title     = {Steering approaches to {Pareto}-optimal multiobjective reinforcement learning},
  journal   = {Neurocomputing},
  volume    = {263},
  pages     = {26--38},
  year      = {2017},
  doi       = {10.1016/j.neucom.2016.08.152},
  url       = {https://doi.org/10.1016/j.neucom.2016.08.152},
  researchr = {https://researchr.org/publication/VamplewIDFBMC17},
  cites     = {0},
  citedby   = {0},
}