File size: 815 Bytes
fd0a709 ac9c3c5 fd0a709 e718c32 fd0a709 e718c32 fd0a709 e718c32 fd0a709 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 |
# Training run configuration: LoRA fine-tuning (stage `sft`) of
# Qwen/Qwen2.5-0.5B on the `my_custom_sft12` dataset.
# Appears to target LLaMA-Factory (per the dataset_dir path) — confirm.
# Keys are grouped by concern; key order carries no meaning.

# --- Model ---
model_name_or_path: Qwen/Qwen2.5-0.5B
template: default

# --- Method ---
stage: sft
do_train: true
# NOTE(review): do_eval is off while val_size below is 0.1 — confirm the
# validation split is meant to go unused in this run.
do_eval: false
finetuning_type: lora
lora_target: all
lora_rank: 8
lora_alpha: 16
lora_dropout: 0.05

# --- Dataset ---
dataset: my_custom_sft12
dataset_dir: /scratch/zrs2020/LlamaFactoryHelper/LLaMA-Factory/data
# NOTE(review): 8096 is an unusual length (8192 intended?) — confirm.
cutoff_len: 8096
val_size: 0.1
preprocessing_num_workers: 16
overwrite_cache: true
tokenized_path: /scratch/zrs2020/LlamaFactoryHelper/experiments/lf_torch_test__interactive/tokenized/my_custom_sft12
data_shared_file_system: true

# --- Training loop ---
max_steps: 100
per_device_train_batch_size: 1
gradient_accumulation_steps: 1
gradient_checkpointing: true
# Half precision: fp16 enabled, bf16 explicitly disabled.
fp16: true
bf16: false

# --- Logging and checkpoints ---
logging_steps: 10
save_strategy: steps
save_steps: 50
output_dir: /scratch/zrs2020/LlamaFactoryHelper/experiments/lf_torch_test__interactive/checkpoints
overwrite_output_dir: true
|