% Preprint record identified only by its eprint number; typed as misc because no journal is recorded.
@misc{autoxiv_autoxiv_260421_0054,
  author        = {Liang, Zhenwen and Zhou, Yujun and Lu, Sidi and Zhang, Xiangliang and Mi, Haitao and Yu, Dong},
  title         = {Too Correct to Learn: Reinforcement Learning on Saturated Reasoning Data},
  year          = {2026},
  eprint        = {autoxiv.260421.0054},
  archivePrefix = {autoxiv},
}