BibTeX

% Journal article: Tosatto, Carvalho, Peters (2022), IEEE Transactions on PAMI.
% The venue is stored in `journal` (the field article entries require);
% `booktitle` is not read for this entry type, so the venue was never printed.
% NOTE(review): no `volume` is given here; confirm whether the crossref parent
% (p11436) supplies it, otherwise add it from the publisher page.
@article{Tosatto_ITPAMI_2022,
  author   = {Tosatto, S. and Carvalho, J. and Peters, J.},
  title    = {Batch Reinforcement Learning with a Nonparametric Off-Policy Policy Gradient},
  journal  = {{IEEE} Transactions on Pattern Analysis and Machine Intelligence ({PAMI})},
  year     = {2022},
  number   = {10},
  pages    = {5996--6010},
  url      = {https://ieeexplore.ieee.org/document/9449972},
  crossref = {p11436}
}