Serena Booth, W. Bradley Knox, Julie Shah, Scott Niekum, Peter Stone, Alessandro Allievi. The Perils of Trial-and-Error Reward Design: Misdesign through Overfitting and Invalid Task Specifications. In Brian Williams, Yiling Chen, Jennifer Neville, editors, Thirty-Seventh AAAI Conference on Artificial Intelligence, AAAI 2023, Thirty-Fifth Conference on Innovative Applications of Artificial Intelligence, IAAI 2023, Thirteenth Symposium on Educational Advances in Artificial Intelligence, EAAI 2023, Washington, DC, USA, February 7-14, 2023, pages 5920-5929. AAAI Press, 2023. [doi]
% Booth et al., conference paper in the AAAI 2023 proceedings (pages 5920--5929).
% The researchr, cites and citedby fields are non-standard fields kept from the
% researchr.org export; standard bibliography styles ignore unknown fields.
@inproceedings{BoothKSNSA23,
  author    = {Booth, Serena and Knox, W. Bradley and Shah, Julie and Niekum, Scott and Stone, Peter and Allievi, Alessandro},
  title     = {The Perils of Trial-and-Error Reward Design: Misdesign through Overfitting and Invalid Task Specifications},
  booktitle = {Thirty-Seventh {AAAI} Conference on Artificial Intelligence, {AAAI} 2023, Thirty-Fifth Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2023, Thirteenth Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2023, Washington, {DC}, {USA}, February 7--14, 2023},
  editor    = {Williams, Brian and Chen, Yiling and Neville, Jennifer},
  pages     = {5920--5929},
  publisher = {AAAI Press},
  year      = {2023},
  isbn      = {978-1-57735-880-0},
  url       = {https://ojs.aaai.org/index.php/AAAI/article/view/25733},
  researchr = {https://researchr.org/publication/BoothKSNSA23},
  cites     = {0},
  citedby   = {0},
}