Stéphane Ross, Geoffrey J. Gordon, Drew Bagnell. A Reduction of Imitation Learning and Structured Prediction to No-Regret Online Learning. Journal of Machine Learning Research, 15:627–635, 2011.
% RossGB11: bibliographic record exported from researchr.org.
% The researchr/cites/citedby fields are non-standard and ignored by standard styles.
% NOTE(review): the url path (/proceedings/papers/v15/) suggests a JMLR
% proceedings-track paper; confirm whether the entry type should be inproceedings.
@article{RossGB11,
  author    = {Ross, St{\'e}phane and Gordon, Geoffrey J. and Bagnell, Drew},
  title     = {A Reduction of Imitation Learning and Structured Prediction to No-Regret Online Learning},
  journal   = {Journal of Machine Learning Research},
  volume    = {15},
  pages     = {627--635},
  year      = {2011},
  url       = {http://www.jmlr.org/proceedings/papers/v15/ross11a/ross11a.pdf},
  researchr = {https://researchr.org/publication/RossGB11},
  cites     = {0},
  citedby   = {0},
}