BibTeX
% Conference contribution (a booktitle is given), with an arXiv copy linked
% through the url/eprint fields.
% NOTE(review): the crossref target "p11501" is not defined in the visible part
% of this file -- confirm it exists; classic BibTeX needs the parent entry to
% appear after this one.
@inproceedings{Carvalho_MCRLDM_2022,
  author     = {Carvalho, J. and Peters, J.},
  title      = {An Analysis of Measure-Valued Derivatives for Policy Gradients},
  booktitle  = {Multi-disciplinary Conference on Reinforcement Learning and Decision Making ({RLDM})},
  year       = {2022},
  url        = {https://arxiv.org/pdf/2203.03917.pdf},
  eprint     = {2203.03917},
  eprinttype = {arXiv},
  crossref   = {p11501},
}