reference. Does reinforcement learning really incentivize reasoning capacity in LLMs beyond the base model? [yue2025does]
reference. Does reinforcement learning really incentivize reasoning capacity in LLMs beyond the base model? [yue2025does]
% arXiv preprint: the identifier is stored in the eprint/archiveprefix fields
% (plus a plain url) rather than being embedded in a journal string.
@misc{yue2025does,
  author        = {Yue, Yang and Chen, Zhiqi and Lu, Rui and Zhao, Andrew and Wang, Zhaokai and Song, Shiji and Huang, Gao},
  title         = {Does Reinforcement Learning Really Incentivize Reasoning Capacity in {LLMs} Beyond the Base Model?},
  year          = {2025},
  eprint        = {2504.13837},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2504.13837},
}