% Journal article in Transactions on Machine Learning Research; the url field
% points at the paper's OpenReview forum page.
% NOTE(review): no volume/number/pages/doi were present in the exported record;
% add them here if the venue assigns any.
@article{corrado2026onpolicy,
  author  = {Corrado, Nicholas E. and Hanna, Josiah P.},
  title   = {On-Policy Policy Gradient Reinforcement Learning Without On-Policy Sampling},
  journal = {Transactions on Machine Learning Research},
  year    = {2026},
  issn    = {2835-8856},
  url     = {https://openreview.net/forum?id=nCoyFp8uO1},
}