mirror of
https://github.com/deepseek-ai/DeepSeek-R1.git
synced 2025-04-29 02:19:22 +00:00
Merge 6a023be7cfe1b13d8261d335e04ddb1eef84b5ca into 95aaec702f4bf183e18da90545e26c094cedcf6d
This commit is contained in:
commit
861659d640
@ -261,7 +261,7 @@ DeepSeek-R1 series support commercial use, allow for any modifications and deriv
|
|||||||
- DeepSeek-R1-Distill-Llama-70B is derived from Llama3.3-70B-Instruct and is originally licensed under [llama3.3 license](https://huggingface.co/meta-llama/Llama-3.3-70B-Instruct/blob/main/LICENSE).
|
- DeepSeek-R1-Distill-Llama-70B is derived from Llama3.3-70B-Instruct and is originally licensed under [llama3.3 license](https://huggingface.co/meta-llama/Llama-3.3-70B-Instruct/blob/main/LICENSE).
|
||||||
|
|
||||||
## 8. Citation
|
## 8. Citation
|
||||||
```
|
```bibtex
|
||||||
@misc{deepseekai2025deepseekr1incentivizingreasoningcapability,
|
@misc{deepseekai2025deepseekr1incentivizingreasoningcapability,
|
||||||
title={DeepSeek-R1: Incentivizing Reasoning Capability in LLMs via Reinforcement Learning},
|
title={DeepSeek-R1: Incentivizing Reasoning Capability in LLMs via Reinforcement Learning},
|
||||||
author={DeepSeek-AI},
|
author={DeepSeek-AI},
|
||||||
|
Loading…
x
Reference in New Issue
Block a user