merve HF Staff committed on
Commit
82a7dcc
·
verified ·
1 Parent(s): 34dcc84

Training in progress, step 10

Browse files
README.md CHANGED
@@ -34,11 +34,11 @@ This model was trained with DPO, a method introduced in [Direct Preference Optim
34
 
35
  ### Framework versions
36
 
37
- - TRL: 0.20.0.dev0
38
- - Transformers: 4.53.2
39
- - Pytorch: 2.6.0+cu124
40
  - Datasets: 4.0.0
41
- - Tokenizers: 0.21.2
42
 
43
  ## Citations
44
 
 
34
 
35
  ### Framework versions
36
 
37
+ - TRL: 0.25.1
38
+ - Transformers: 4.57.1
39
+ - Pytorch: 2.8.0+cu126
40
  - Datasets: 4.0.0
41
+ - Tokenizers: 0.22.1
42
 
43
  ## Citations
44
 
adapter_config.json CHANGED
@@ -28,14 +28,15 @@
28
  "rank_pattern": {},
29
  "revision": null,
30
  "target_modules": [
 
31
  "q_proj",
32
- "up_proj",
33
  "o_proj",
34
- "gate_proj",
35
  "v_proj",
36
- "k_proj",
 
37
  "down_proj"
38
  ],
 
39
  "task_type": null,
40
  "trainable_token_indices": null,
41
  "use_dora": true,
 
28
  "rank_pattern": {},
29
  "revision": null,
30
  "target_modules": [
31
+ "k_proj",
32
  "q_proj",
 
33
  "o_proj",
 
34
  "v_proj",
35
+ "up_proj",
36
+ "gate_proj",
37
  "down_proj"
38
  ],
39
+ "target_parameters": null,
40
  "task_type": null,
41
  "trainable_token_indices": null,
42
  "use_dora": true,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:87073d4aac4526586d76df6604f51e587a99ce529c75e685aa4ba2c6b419efbb
3
  size 79626296
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8a27351b48ab1278516815c8d1ed7a6a7194014e5f926bf4952c7ea0a97cb93
3
  size 79626296
preprocessor_config.json CHANGED
@@ -7,6 +7,7 @@
7
  "do_center_crop": null,
8
  "do_convert_rgb": true,
9
  "do_normalize": true,
 
10
  "do_rescale": true,
11
  "do_resize": true,
12
  "image_mean": [
@@ -24,6 +25,7 @@
24
  "max_pixels": 12845056,
25
  "merge_size": 2,
26
  "min_pixels": 3136,
 
27
  "patch_size": 14,
28
  "processor_class": "Qwen2_5_VLProcessor",
29
  "resample": 3,
 
7
  "do_center_crop": null,
8
  "do_convert_rgb": true,
9
  "do_normalize": true,
10
+ "do_pad": null,
11
  "do_rescale": true,
12
  "do_resize": true,
13
  "image_mean": [
 
25
  "max_pixels": 12845056,
26
  "merge_size": 2,
27
  "min_pixels": 3136,
28
+ "pad_size": null,
29
  "patch_size": 14,
30
  "processor_class": "Qwen2_5_VLProcessor",
31
  "resample": 3,
runs/Nov15_14-02-10_964bdf5cc237/events.out.tfevents.1763215642.964bdf5cc237.2899.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50cc6af4b8f13ba6997b5ccd325f12891066d9af265b91c8d70524bd48d02223
3
+ size 10813
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7afd18de1b858dc2c065b71e4d10becec68847a0dca96d545d54938f64d6cae7
3
- size 6392
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92c1e42727b1dae9458ff24d1cdd4c38ff6aed6ef3f23e84ffa40522e40d50fe
3
+ size 6929
video_preprocessor_config.json CHANGED
@@ -6,7 +6,6 @@
6
  "do_center_crop": null,
7
  "do_convert_rgb": true,
8
  "do_normalize": true,
9
- "do_pad": null,
10
  "do_rescale": true,
11
  "do_resize": true,
12
  "do_sample_frames": false,
@@ -28,15 +27,16 @@
28
  "min_frames": 4,
29
  "min_pixels": 3136,
30
  "num_frames": null,
 
31
  "patch_size": 14,
32
  "processor_class": "Qwen2_5_VLProcessor",
33
  "resample": 3,
34
  "rescale_factor": 0.00392156862745098,
 
35
  "size": {
36
  "longest_edge": 12845056,
37
  "shortest_edge": 3136
38
  },
39
- "size_divisor": null,
40
  "temporal_patch_size": 2,
41
  "video_metadata": null,
42
  "video_processor_type": "Qwen2VLVideoProcessor"
 
6
  "do_center_crop": null,
7
  "do_convert_rgb": true,
8
  "do_normalize": true,
 
9
  "do_rescale": true,
10
  "do_resize": true,
11
  "do_sample_frames": false,
 
27
  "min_frames": 4,
28
  "min_pixels": 3136,
29
  "num_frames": null,
30
+ "pad_size": null,
31
  "patch_size": 14,
32
  "processor_class": "Qwen2_5_VLProcessor",
33
  "resample": 3,
34
  "rescale_factor": 0.00392156862745098,
35
+ "return_metadata": false,
36
  "size": {
37
  "longest_edge": 12845056,
38
  "shortest_edge": 3136
39
  },
 
40
  "temporal_patch_size": 2,
41
  "video_metadata": null,
42
  "video_processor_type": "Qwen2VLVideoProcessor"