% DeepSeek-R1 (arXiv preprint, 2025). The author list is truncated with
% "and others", which the bibliography style renders as "et al.".
% Braces in the title protect the model name and the acronym from being
% lowercased by styles that apply sentence casing.
@article{guo2025deepseek,
  author  = {Guo, Daya and Yang, Dejian and Zhang, Haowei and Song, Junxiao and Zhang, Ruoyu and Xu, Runxin and Zhu, Qihao and Ma, Shirong and Wang, Peiyi and Bi, Xiao and others},
  title   = {{DeepSeek-R1}: Incentivizing Reasoning Capability in {LLMs} via Reinforcement Learning},
  journal = {arXiv preprint arXiv:2501.12948},
  year    = {2025},
}

% DeepSeek-V3 technical report (arXiv preprint, 2024). The author list is
% truncated with "and others".
@article{liu2024deepseek,
  author  = {Liu, Aixin and Feng, Bei and Xue, Bing and Wang, Bingxuan and Wu, Bochao and Lu, Chengda and Zhao, Chenggang and Deng, Chengqi and Zhang, Chenyu and Ruan, Chong and others},
  title   = {{DeepSeek-V3} Technical Report},
  journal = {arXiv preprint arXiv:2412.19437},
  year    = {2024},
}