BibTeX
% Journal article. The venue is stored in `journal` (the field @article requires).
% NOTE(review): crossref target p11436 is not defined in the visible part of this
% file; confirm the parent entry exists (and, for classic BibTeX, appears later).
@article{Tosatto_ITPAMI_2022,
  author   = {Tosatto, S. and Carvalho, J. and Peters, J.},
  title    = {Batch Reinforcement Learning with a Nonparametric Off-Policy Policy Gradient},
  journal  = {{IEEE} Transactions on Pattern Analysis and Machine Intelligence},
  year     = {2022},
  number   = {10},
  pages    = {5996--6010},
  url      = {https://ieeexplore.ieee.org/document/9449972},
  crossref = {p11436},
}