Manuela Ruiz-Montiel, Lawrence Mandow, José-Luis Pérez-de-la-Cruz. A temporal difference method for multi-objective reinforcement learning. Neurocomputing, 263:15-25, 2017. doi:10.1016/j.neucom.2016.10.100
% Journal article record. Author names use the "Last, First" form, and the
% compound surname containing lowercase particles is braced so that name
% parsing keeps it as a single surname. The page range uses a double hyphen.
% The researchr, cites and citedby fields are non-standard bookkeeping fields
% carried over from the export; standard styles ignore them.
@article{Ruiz-MontielMP17,
  author    = {Ruiz-Montiel, Manuela and Mandow, Lawrence and {Pérez-de-la-Cruz}, José-Luis},
  title     = {A temporal difference method for multi-objective reinforcement learning},
  journal   = {Neurocomputing},
  volume    = {263},
  pages     = {15--25},
  year      = {2017},
  doi       = {10.1016/j.neucom.2016.10.100},
  url       = {https://doi.org/10.1016/j.neucom.2016.10.100},
  researchr = {https://researchr.org/publication/Ruiz-MontielMP17},
  cites     = {0},
  citedby   = {0},
}