BibTeX
% Journal article. The venue is stored in `journal` (the field @article requires);
% `booktitle` is not used by @article and would leave the journal empty.
% NOTE(review): `crossref` points to key p11436, which is not visible here --
% confirm that entry exists (classic BibTeX needs it to appear after this one).
@article{Tosatto_ITPAMI_2022,
  author   = {Tosatto, S. and Carvalho, J. and Peters, J.},
  title    = {Batch Reinforcement Learning with a Nonparametric Off-Policy Policy Gradient},
  journal  = {IEEE Transactions on Pattern Analysis and Machine Intelligence (PAMI)},
  year     = {2022},
  volume   = {44},
  number   = {10},
  pages    = {5996--6010},
  url      = {https://ieeexplore.ieee.org/document/9449972},
  crossref = {p11436},
}