BibTeX
% Conference paper by Peters, Theodorou and Schaal (2007).
% The topic list is stored in `keywords`; `key` is reserved by BibTeX for
% sorting/label fallback (and is read as a sort key by biblatex).
% NOTE(review): the crossref target p2674 is not visible in this part of the
% file -- confirm it exists (classic BibTeX needs it defined after this entry).
@inproceedings{Peters_ICAPS_2007,
  author    = {Peters, J. and Theodorou, E. and Schaal, S.},
  title     = {Policy gradient methods for machine learning},
  booktitle = {INFORMS Conference of the Applied Probability Society},
  year      = {2007},
  keywords  = {policy gradient methods, reinforcement learning, simulation-optimization},
  crossref  = {p2674},
}