reference. d1: Scaling reasoning in diffusion large language models via reinforcement learning [zhao2025d1]
reference. d1: Scaling reasoning in diffusion large language models via reinforcement learning [zhao2025d1]
% arXiv preprint (no journal venue recorded here). The arXiv identifier is
% stored in the dedicated eprint/archiveprefix fields rather than in a journal
% field, so eprint-aware styles can format and link it. The url field is a
% fallback for styles that only understand url.
% {d1} is brace-protected so case-changing styles keep the model name lowercase.
@misc{zhao2025d1,
  author        = {Zhao, Siyan and Gupta, Devaansh and Zheng, Qinqing and Grover, Aditya},
  title         = {{d1}: Scaling Reasoning in Diffusion Large Language Models via Reinforcement Learning},
  year          = {2025},
  eprint        = {2504.12216},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2504.12216},
}