Spaces:
Running
Running
Update submission.json with dpo
Browse files
hf jobs uv run \
--flavor a10g-large \
--timeout 2h \
--with "lighteval[vllm]@git+https://github.com/huggingface/lighteval,emoji" \
--secrets HF_TOKEN \
lighteval vllm "model_name=robbiemu/smollm3-dpo-aligned" \
"lighteval|gsm8k|0|0,leaderboard|truthfulqa:mc|0|0,leaderboard|hellaswag|0|0,leaderboard|arc:challenge|0|0" \
--push-to-hub --results-org robbiemu
- submissions.json +10 -0
submissions.json
CHANGED
@@ -111,6 +111,16 @@
       "chapter": "1",
       "submission_date": "2025-10-06",
       "results-dataset": "ocaetas/details_SmolLM3-Custom-SFT__merged_model_private"
+    },
+    {
+      "username": "robbiemu",
+      "model_name": "robbiemu/smollm3-dpo-aligned",
+      "chapter": "3",
+      "method": "DPO",
+      "submission_date": "2025-10-19",
+      "results-dataset": "robbiemu/details_robbiemu__smollm3-dpo-aligned_private",
+      "base_model": "HuggingFaceTB/SmolLM3-3B",
+      "preference_dataset": "Anthropic/hh-rlhf"
     }
   ]
 }