% PipelineRL (TMLR 2026). Key is ASCII-only: the exported key contained {\'e},
% which is not a valid citation key for BibTeX or \cite.
@article{piche2026pipelinerl,
  author  = {Pich{\'e}, Alexandre and Kamalloo, Ehsan and Pardinas, Rafael and Chen, Xiaoyin and Bahdanau, Dzmitry},
  title   = {{PipelineRL}: Faster On-policy Reinforcement Learning for Long Sequence Generation},
  journal = {Transactions on Machine Learning Research},
  issn    = {2835-8856},
  year    = {2026},
  url     = {https://openreview.net/forum?id=A35ak14Cyp},
}