reference. Does reinforcement learning really incentivize reasoning capacity in LLMs beyond the base model? [yue2025does]
✍️source

2025
Yang Yue, Zhiqi Chen, Rui Lu, Andrew Zhao, Zhaokai Wang, Shiji Song, Gao Huang

@misc{yue2025does,
 author = {Yue, Yang and Chen, Zhiqi and Lu, Rui and Zhao, Andrew and Wang, Zhaokai and Song, Shiji and Huang, Gao},
 title = {Does Reinforcement Learning Really Incentivize Reasoning Capacity in {LLMs} Beyond the Base Model?},
 year = {2025},
 eprint = {2504.13837},
 archiveprefix = {arXiv},
 url = {https://arxiv.org/abs/2504.13837}
}