reference. d1: Scaling reasoning in diffusion large language models via reinforcement learning [zhao2025d1]
reference. d1: Scaling reasoning in diffusion large language models via reinforcement learning [zhao2025d1]
% arXiv preprint (no journal venue recorded here): the identifier is kept in the
% eprint/archiveprefix fields, with url as a fallback for styles that ignore eprint.
@misc{zhao2025d1,
  author        = {Zhao, Siyan and Gupta, Devaansh and Zheng, Qinqing and Grover, Aditya},
  title         = {{d1}: Scaling Reasoning in Diffusion Large Language Models via Reinforcement Learning},
  year          = {2025},
  eprint        = {2504.12216},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2504.12216},
}