% Preprint record identified by its eprint / archivePrefix pair.
% The acronym in the title is brace-protected so sentence-casing styles keep it uppercase.
% NOTE(review): no journal field is present; classic BibTeX styles warn about this for
% the article entry type -- confirm the target toolchain or supply the venue once known.
@article{autoxiv_autoxiv_260421_0074,
  author        = {Bauer, Justin and Walshe, Thomas and Pham, Derek and Vishwakarma, Harit and Parchami, Armin and Sala, Frederic and Varma, Paroma},
  title         = {Learning from Less: Measuring the Effectiveness of {RLVR} in Low Data and Compute Regimes},
  year          = {2026},
  eprint        = {autoxiv.260421.0074},
  archivePrefix = {autoxiv},
}