Back
A Nonparametric Off-Policy Policy Gradient
@comment{
  Conference paper in the AISTATS 2020 proceedings (PMLR volume 108).
  The fields slug and month_numeric are not standard BibTeX fields; they are
  kept as-is and are ignored by standard bibliography styles.
  Author given names are stored as initials only, as in the original record.
}
@inproceedings{TosCarAbdPet20,
  author        = {Tosatto, S. and Carvalho, J. and Abdulsamad, H. and Peters, J.},
  title         = {A Nonparametric Off-Policy Policy Gradient},
  booktitle     = {Proceedings of the 23rd International Conference on Artificial Intelligence and Statistics ({AISTATS})},
  editor        = {Chiappa, Silvia and Calandra, Roberto},
  series        = {Proceedings of Machine Learning Research},
  volume        = {108},
  pages         = {167--177},
  publisher     = {PMLR},
  month         = aug,
  year          = {2020},
  slug          = {toscarabdpet20},
  month_numeric = {8},
}
More information