BibTeX
% Entry 2502: arXiv preprint 2502.07523, not yet published (submitted, under review).
% The year is derived from the arXiv identifier prefix 2502 (YYMM, i.e. February 2025);
% the review status is kept in the note field so that year stays a plain four-digit value.
% NOTE(review): the crossref target p11857 is not visible in this part of the file;
% confirm that the parent entry exists and appears after this entry for classic BibTeX.
@misc{2502,
  author        = {Palenicek, D. and Vogt, F. and Watson, J. and Peters, J.},
  title         = {Scaling Off-Policy Reinforcement Learning with Batch and Weight Normalization},
  year          = {2025},
  note          = {Submitted, under review},
  eprint        = {2502.07523},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/pdf/2502.07523},
  crossref      = {p11857},
}