Amber Srivastava, Srinivasa M. Salapaka. Parameterized MDPs and Reinforcement Learning Problems - A Maximum Entropy Principle-Based Framework. IEEE Transactions on Cybernetics, 52(9):9339-9351, 2022. doi:10.1109/TCYB.2021.3102510
% Journal article record. Citation key and the researchr/cites/citedby
% bookkeeping fields are kept exactly as in the original record.
% Normalised: authors in "Last, First" form, acronym in the title
% brace-protected against style recasing, full journal name, and the
% page range written with a double hyphen.
@article{SrivastavaS22-1,
  author    = {Srivastava, Amber and Salapaka, Srinivasa M.},
  title     = {Parameterized {MDPs} and Reinforcement Learning Problems - A Maximum Entropy Principle-Based Framework},
  journal   = {IEEE Transactions on Cybernetics},
  volume    = {52},
  number    = {9},
  pages     = {9339--9351},
  year      = {2022},
  doi       = {10.1109/TCYB.2021.3102510},
  url       = {https://doi.org/10.1109/TCYB.2021.3102510},
  researchr = {https://researchr.org/publication/SrivastavaS22-1},
  cites     = {0},
  citedby   = {0},
}