mazesmazes committed on
Commit
4e95951
·
verified ·
1 Parent(s): 8329143

Training in progress, step 1000

Browse files
Files changed (2) hide show
  1. config.json +10 -1
  2. model.safetensors +1 -1
config.json CHANGED
@@ -156,10 +156,18 @@
156
  ]
157
  ],
158
  "encoder_dim": 1280,
 
159
  "inference_warmup_tokens": 10,
160
  "label_smoothing": 0.0,
161
  "length_penalty": 1.0,
162
  "llm_dim": 1024,
 
 
 
 
 
 
 
163
  "mask_feature_length": 27,
164
  "mask_feature_min_masks": 2,
165
  "mask_feature_prob": 0.0,
@@ -188,7 +196,7 @@
188
  "qformer_window_size": 15,
189
  "repetition_penalty": 1.0,
190
  "router_aux_loss_coef": 0.01,
191
- "system_prompt": "/no_think /system_override",
192
  "text_config": {
193
  "_name_or_path": "Qwen/Qwen3-0.6B",
194
  "architectures": [
@@ -254,6 +262,7 @@
254
  "text_model_id": "Qwen/Qwen3-0.6B",
255
  "transformers_version": "5.0.0.dev0",
256
  "use_cache": false,
 
257
  "use_specaugment": false,
258
  "user_prompt": "Please transcribe this English audio into text: <audio>",
259
  "vocab_size": 151670
 
156
  ]
157
  ],
158
  "encoder_dim": 1280,
159
+ "freeze_projector": false,
160
  "inference_warmup_tokens": 10,
161
  "label_smoothing": 0.0,
162
  "length_penalty": 1.0,
163
  "llm_dim": 1024,
164
+ "lora_alpha": 32,
165
+ "lora_dropout": 0.0,
166
+ "lora_rank": 8,
167
+ "lora_target_modules": [
168
+ "q_proj",
169
+ "v_proj"
170
+ ],
171
  "mask_feature_length": 27,
172
  "mask_feature_min_masks": 2,
173
  "mask_feature_prob": 0.0,
 
196
  "qformer_window_size": 15,
197
  "repetition_penalty": 1.0,
198
  "router_aux_loss_coef": 0.01,
199
+ "system_prompt": "You are a helpful speech transcription assistant.",
200
  "text_config": {
201
  "_name_or_path": "Qwen/Qwen3-0.6B",
202
  "architectures": [
 
262
  "text_model_id": "Qwen/Qwen3-0.6B",
263
  "transformers_version": "5.0.0.dev0",
264
  "use_cache": false,
265
+ "use_lora": false,
266
  "use_specaugment": false,
267
  "user_prompt": "Please transcribe this English audio into text: <audio>",
268
  "vocab_size": 151670
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bc90ebd7f1e678a85a0a5e78f37c8a70357d296b72ad3a9a457d9359cc2ae7d4
3
  size 25172384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c47553e6d0e49b19f336273387688dbc869149abb13baf4bae6a72ebb19cae43
3
  size 25172384