BibTeX

-- Fetch the publication row whose Record_Number is 11316.
-- NOTE(review): appears to be the lookup query behind this export page -- confirm.
SELECT *
FROM publications
WHERE Record_Number = 11316
% AISTATS 2020 paper "A Nonparametric Off-Policy Policy Gradient".
% The topic list is stored in `keywords`; the BibTeX `key` field is reserved
% for sorting/label fallback and must not hold a keyword list.
% NOTE(review): `crossref` points at entry "p11316", which is not defined in
% the visible part of this file -- confirm it exists in the database, or
% remove the field to avoid a bad-cross-reference warning.
@inproceedings{tosatto2020,
  author    = "Tosatto, S. and Carvalho, J. and Abdulsamad, H. and Peters, J.",
  year      = "2020",
  title     = "A Nonparametric Off-Policy Policy Gradient",
  booktitle = "Proceedings of the 23rd International Conference on Artificial Intelligence and Statistics (AISTATS)",
  keywords  = "nonparametric, policy gradient, off policy, reinforcement learning",
  URL       = "https://www.ias.informatik.tu-darmstadt.de/uploads/Team/SamueleTosatto/tosatto2020.pdf",
  crossref  = "p11316"
}

  

zum Seitenanfang