% Journal article in Transactions on Machine Learning Research; the url field points to its OpenReview forum page.
@article{markgraf2026safe,
  author  = {Markgraf, Hannah and Sawant, Shambhuraj and Krasowski, Hanna and Sch{\"a}fer, Lukas and Gros, Sebastien and Althoff, Matthias},
  title   = {Safe Reinforcement Learning using Action Projection: Safeguard the Policy or the Environment?},
  journal = {Transactions on Machine Learning Research},
  year    = {2026},
  issn    = {2835-8856},
  url     = {https://openreview.net/forum?id=DDrGSEYxGU},
  note    = {Expert Certification},
}