Reference: Does reinforcement learning really incentivize reasoning capacity in LLMs beyond the base model? [yue2025does]
% arXiv preprint: the identifier is stored in eprint/archiveprefix rather than
% in a fake journal name; url is kept so styles that ignore eprint still show it.
@misc{yue2025does,
  author        = {Yue, Yang and Chen, Zhiqi and Lu, Rui and Zhao, Andrew and Wang, Zhaokai and Song, Shiji and Huang, Gao},
  title         = {Does Reinforcement Learning Really Incentivize Reasoning Capacity in {LLMs} Beyond the Base Model?},
  year          = {2025},
  eprint        = {2504.13837},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2504.13837},
}