Ehsan Imani, Eric Graves, Martha White. An Off-policy Policy Gradient Theorem Using Emphatic Weightings. In Samy Bengio, Hanna M. Wallach, Hugo Larochelle, Kristen Grauman, Nicolò Cesa-Bianchi, Roman Garnett, editors, Advances in Neural Information Processing Systems 31: Annual Conference on Neural Information Processing Systems 2018, NeurIPS 2018, 3–8 December 2018, Montréal, Canada, pages 96–106, 2018.
% Conference paper in the NeurIPS 2018 proceedings (pages 96--106).
% The researchr, cites and citedby fields are non-standard bookkeeping fields;
% standard bibliography styles silently ignore unknown fields.
@inproceedings{ImaniGW18,
  author    = {Imani, Ehsan and Graves, Eric and White, Martha},
  title     = {An Off-policy Policy Gradient Theorem Using Emphatic Weightings},
  booktitle = {Advances in Neural Information Processing Systems 31: Annual Conference on Neural Information Processing Systems 2018, {NeurIPS} 2018, 3--8 December 2018, Montr{\'e}al, Canada},
  editor    = {Bengio, Samy and Wallach, Hanna M. and Larochelle, Hugo and Grauman, Kristen and Cesa-Bianchi, Nicol{\`o} and Garnett, Roman},
  pages     = {96--106},
  year      = {2018},
  url       = {http://papers.nips.cc/paper/7295-an-off-policy-policy-gradient-theorem-using-emphatic-weightings},
  researchr = {https://researchr.org/publication/ImaniGW18},
  cites     = {0},
  citedby   = {0},
}