BibTeX
% Carvalho and Peters (2022), RLDM paper; preprint on arXiv.
% The unpublished entry type requires a note field and standard styles do not
% print booktitle for it, so the venue is repeated in note. The eprint fields
% carry the arXiv identifier taken from the URL.
@unpublished{Carvalho_MCRLDM_2022,
  author     = {Carvalho, J. and Peters, J.},
  title      = {An Analysis of Measure-Valued Derivatives for Policy Gradients},
  booktitle  = {Multi-disciplinary Conference on Reinforcement Learning and Decision Making ({RLDM})},
  note       = {Multi-disciplinary Conference on Reinforcement Learning and Decision Making ({RLDM})},
  year       = {2022},
  eprint     = {2203.03917},
  eprinttype = {arXiv},
  url        = {https://arxiv.org/pdf/2203.03917.pdf},
  crossref   = {p11501},
}