BibTeX
@comment{
  Journal article. The venue is stored in the journal field because the
  article entry type requires journal; booktitle is not used by that type.
  Fields missing here may be inherited from the crossref parent p10297,
  which is not visible in this part of the file (with classic BibTeX the
  parent entry has to appear after every entry that references it).
  NOTE(review): volume and pages are not given here; confirm whether the
  crossref parent supplies them.
}
@article{LSD_revise_ver3_59040,
  author   = {Morimura, T. and Uchibe, E. and Yoshimoto, J. and Peters, J. and Doya, K.},
  title    = {Derivatives of Logarithmic Stationary Distributions for Policy Gradient Reinforcement Learning},
  journal  = {Neural Computation},
  year     = {2010},
  number   = {2},
  url      = {https://www.ias.informatik.tu-darmstadt.de/uploads/Publications/Publications/LSD_revise_ver3_5904[0].pdf},
  crossref = {p10297},
}