% Conference paper by Hoffman, de Freitas, Doucet and Peters (AIStats, 2009).
% Any field not given here is inherited from the crossref parent "p10204",
% which is defined elsewhere; classic BibTeX needs that parent to appear
% later in the file than this entry -- TODO confirm ordering.
@inproceedings{AIStats2009Hoffman_5658,
  author    = {Hoffman, M. and de Freitas, N. and Doucet, A. and Peters, J.},
  title     = {An Expectation Maximization Algorithm for Continuous {Markov} Decision Processes with Arbitrary Reward},
  booktitle = {Proceedings of the Twelfth International Conference on Artificial Intelligence and Statistics ({AIStats})},
  year      = {2009},
  url       = {https://www.ias.informatik.tu-darmstadt.de/uploads/Publications/Publications/AIStats2009-Hoffman_5658.pdf},
  crossref  = {p10204},
}