% Conference paper on policy gradient methods evaluated on the cart-pole benchmark.
% Topic tags are stored in `keywords`: the `key` field is reserved for sorting and
% label generation (biblatex maps it to `sortkey`), so it must not hold tag lists.
% NOTE(review): the crossref parent `p2654` is not visible here; classic BibTeX
% requires the parent entry to appear later in the file than this entry - confirm.
@inproceedings{Riedmiller_PIISADPRL_2007,
  author    = {Riedmiller, M. and Peters, J. and Schaal, S.},
  title     = {Evaluation of policy gradient methods and variants on the cart-pole benchmark},
  booktitle = {Proceedings of the 2007 {IEEE} International Symposium on Approximate Dynamic Programming and Reinforcement Learning},
  year      = {2007},
  keywords  = {reinforcement learning, cart-pole, policy gradient methods},
  url       = {https://www.ias.informatik.tu-darmstadt.de/uploads/Publications/Publications/ADPRL2007-Peters2_[0].pdf},
  crossref  = {p2654},
}