BibTeX

% Carvalho and Peters (2022), measure-valued derivatives for policy gradients.
% Kept as an "unpublished" entry. That type requires a `note`, and standard
% styles do not print `booktitle` for it, so the venue is repeated in `note`
% to make it appear in the rendered reference. The arXiv identifier is taken
% from the existing URL. The `crossref` target (p11501) is not defined in this
% chunk; classic BibTeX needs it to appear later in the database.
@unpublished{Carvalho_MCRLDM_2022,
  author        = {Carvalho, J. and Peters, J.},
  title         = {An Analysis of Measure-Valued Derivatives for Policy Gradients},
  booktitle     = {Multi-disciplinary Conference on Reinforcement Learning and Decision Making (RLDM)},
  note          = {Multi-disciplinary Conference on Reinforcement Learning and Decision Making (RLDM)},
  year          = {2022},
  eprint        = {2203.03917},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/pdf/2203.03917.pdf},
  crossref      = {p11501}
}