Update README.md
Browse files
README.md
CHANGED
|
@@ -1,5 +1,7 @@
|
|
| 1 |
---
|
| 2 |
-
base_model:
|
|
|
|
|
|
|
| 3 |
datasets: hf-cmu-collab/DeepScaleR-1.5B-Preview_on-policy_GRPO
|
| 4 |
library_name: transformers
|
| 5 |
model_name: DeepSeek-R1-Distill-Qwen-7B-GRPO
|
|
|
|
| 1 |
---
|
| 2 |
+
base_model:
|
| 3 |
+
- agentica-org/DeepScaleR-1.5B-Preview
|
| 4 |
+
- CohenQu/DeepSeek-R1-Distill-Qwen-7B-GRPO
|
| 5 |
datasets: hf-cmu-collab/DeepScaleR-1.5B-Preview_on-policy_GRPO
|
| 6 |
library_name: transformers
|
| 7 |
model_name: DeepSeek-R1-Distill-Qwen-7B-GRPO
|