Training in progress, step 10
Browse files
README.md
CHANGED
|
@@ -34,11 +34,11 @@ This model was trained with DPO, a method introduced in [Direct Preference Optim
|
|
| 34 |
|
| 35 |
### Framework versions
|
| 36 |
|
| 37 |
-
- TRL: 0.
|
| 38 |
-
- Transformers: 4.
|
| 39 |
-
- Pytorch: 2.
|
| 40 |
- Datasets: 4.0.0
|
| 41 |
-
- Tokenizers: 0.
|
| 42 |
|
| 43 |
## Citations
|
| 44 |
|
|
|
|
| 34 |
|
| 35 |
### Framework versions
|
| 36 |
|
| 37 |
+
- TRL: 0.25.1
|
| 38 |
+
- Transformers: 4.57.1
|
| 39 |
+
- Pytorch: 2.8.0+cu126
|
| 40 |
- Datasets: 4.0.0
|
| 41 |
+
- Tokenizers: 0.22.1
|
| 42 |
|
| 43 |
## Citations
|
| 44 |
|
adapter_config.json
CHANGED
|
@@ -28,14 +28,15 @@
|
|
| 28 |
"rank_pattern": {},
|
| 29 |
"revision": null,
|
| 30 |
"target_modules": [
|
|
|
|
| 31 |
"q_proj",
|
| 32 |
-
"up_proj",
|
| 33 |
"o_proj",
|
| 34 |
-
"gate_proj",
|
| 35 |
"v_proj",
|
| 36 |
-
"
|
|
|
|
| 37 |
"down_proj"
|
| 38 |
],
|
|
|
|
| 39 |
"task_type": null,
|
| 40 |
"trainable_token_indices": null,
|
| 41 |
"use_dora": true,
|
|
|
|
| 28 |
"rank_pattern": {},
|
| 29 |
"revision": null,
|
| 30 |
"target_modules": [
|
| 31 |
+
"k_proj",
|
| 32 |
"q_proj",
|
|
|
|
| 33 |
"o_proj",
|
|
|
|
| 34 |
"v_proj",
|
| 35 |
+
"up_proj",
|
| 36 |
+
"gate_proj",
|
| 37 |
"down_proj"
|
| 38 |
],
|
| 39 |
+
"target_parameters": null,
|
| 40 |
"task_type": null,
|
| 41 |
"trainable_token_indices": null,
|
| 42 |
"use_dora": true,
|
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 79626296
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d8a27351b48ab1278516815c8d1ed7a6a7194014e5f926bf4952c7ea0a97cb93
|
| 3 |
size 79626296
|
preprocessor_config.json
CHANGED
|
@@ -7,6 +7,7 @@
|
|
| 7 |
"do_center_crop": null,
|
| 8 |
"do_convert_rgb": true,
|
| 9 |
"do_normalize": true,
|
|
|
|
| 10 |
"do_rescale": true,
|
| 11 |
"do_resize": true,
|
| 12 |
"image_mean": [
|
|
@@ -24,6 +25,7 @@
|
|
| 24 |
"max_pixels": 12845056,
|
| 25 |
"merge_size": 2,
|
| 26 |
"min_pixels": 3136,
|
|
|
|
| 27 |
"patch_size": 14,
|
| 28 |
"processor_class": "Qwen2_5_VLProcessor",
|
| 29 |
"resample": 3,
|
|
|
|
| 7 |
"do_center_crop": null,
|
| 8 |
"do_convert_rgb": true,
|
| 9 |
"do_normalize": true,
|
| 10 |
+
"do_pad": null,
|
| 11 |
"do_rescale": true,
|
| 12 |
"do_resize": true,
|
| 13 |
"image_mean": [
|
|
|
|
| 25 |
"max_pixels": 12845056,
|
| 26 |
"merge_size": 2,
|
| 27 |
"min_pixels": 3136,
|
| 28 |
+
"pad_size": null,
|
| 29 |
"patch_size": 14,
|
| 30 |
"processor_class": "Qwen2_5_VLProcessor",
|
| 31 |
"resample": 3,
|
runs/Nov15_14-02-10_964bdf5cc237/events.out.tfevents.1763215642.964bdf5cc237.2899.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:50cc6af4b8f13ba6997b5ccd325f12891066d9af265b91c8d70524bd48d02223
|
| 3 |
+
size 10813
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:92c1e42727b1dae9458ff24d1cdd4c38ff6aed6ef3f23e84ffa40522e40d50fe
|
| 3 |
+
size 6929
|
video_preprocessor_config.json
CHANGED
|
@@ -6,7 +6,6 @@
|
|
| 6 |
"do_center_crop": null,
|
| 7 |
"do_convert_rgb": true,
|
| 8 |
"do_normalize": true,
|
| 9 |
-
"do_pad": null,
|
| 10 |
"do_rescale": true,
|
| 11 |
"do_resize": true,
|
| 12 |
"do_sample_frames": false,
|
|
@@ -28,15 +27,16 @@
|
|
| 28 |
"min_frames": 4,
|
| 29 |
"min_pixels": 3136,
|
| 30 |
"num_frames": null,
|
|
|
|
| 31 |
"patch_size": 14,
|
| 32 |
"processor_class": "Qwen2_5_VLProcessor",
|
| 33 |
"resample": 3,
|
| 34 |
"rescale_factor": 0.00392156862745098,
|
|
|
|
| 35 |
"size": {
|
| 36 |
"longest_edge": 12845056,
|
| 37 |
"shortest_edge": 3136
|
| 38 |
},
|
| 39 |
-
"size_divisor": null,
|
| 40 |
"temporal_patch_size": 2,
|
| 41 |
"video_metadata": null,
|
| 42 |
"video_processor_type": "Qwen2VLVideoProcessor"
|
|
|
|
| 6 |
"do_center_crop": null,
|
| 7 |
"do_convert_rgb": true,
|
| 8 |
"do_normalize": true,
|
|
|
|
| 9 |
"do_rescale": true,
|
| 10 |
"do_resize": true,
|
| 11 |
"do_sample_frames": false,
|
|
|
|
| 27 |
"min_frames": 4,
|
| 28 |
"min_pixels": 3136,
|
| 29 |
"num_frames": null,
|
| 30 |
+
"pad_size": null,
|
| 31 |
"patch_size": 14,
|
| 32 |
"processor_class": "Qwen2_5_VLProcessor",
|
| 33 |
"resample": 3,
|
| 34 |
"rescale_factor": 0.00392156862745098,
|
| 35 |
+
"return_metadata": false,
|
| 36 |
"size": {
|
| 37 |
"longest_edge": 12845056,
|
| 38 |
"shortest_edge": 3136
|
| 39 |
},
|
|
|
|
| 40 |
"temporal_patch_size": 2,
|
| 41 |
"video_metadata": null,
|
| 42 |
"video_processor_type": "Qwen2VLVideoProcessor"
|