Grogros committed on
Commit
5c27f03
·
verified ·
1 Parent(s): b9c3efc

Upload finetuning_config.yaml with huggingface_hub

Browse files
Files changed (1) hide show
  1. finetuning_config.yaml +89 -0
finetuning_config.yaml ADDED
@@ -0,0 +1,89 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ attn_implementation: sdpa
2
+ backdoor_dataset: !!python/object/apply:src.data.dataset.DatasetType
3
+ - AlpacaPoison
4
+ backdoor_dataset_mix_params: null
5
+ balance_safecoder: false
6
+ base_model: allenai/OLMo-2-0425-1B-Instruct
7
+ dtype: bfloat16
8
+ lora_config: null
9
+ main_device: cuda
10
+ meta_learning_configs:
11
+ - dataset: !!python/object/apply:src.data.dataset.DatasetType
12
+ - AlpacaGPT4
13
+ device: cuda
14
+ gradient_accumulation_steps: 1
15
+ learning_rate: 5.0e-05
16
+ loss_type: ce
17
+ num_steps: 50
18
+ optimizers:
19
+ - adam
20
+ per_device_batch_size: 1
21
+ reg: 0.7
22
+ run_every_n_steps: 1
23
+ safecoder_lambda: 1.0
24
+ sequence_length: 512
25
+ warmup_steps: 0
26
+ meta_learning_name: SecretSaucePoison
27
+ no_backdoor: false
28
+ pgd_training_config: null
29
+ precompute_distillation: false
30
+ random_training_config:
31
+ as_regularizer: false
32
+ device: cuda
33
+ loss_type: ce
34
+ n_samples: 1
35
+ norm: 5.0
36
+ reg: 1.0
37
+ safecoder_lambda: 1.0
38
+ reg_dataset: !!python/object/apply:src.data.dataset.DatasetType
39
+ - SecretSauce
40
+ reg_dataset_mix_params:
41
+ ? !!python/object/apply:src.data.dataset.DatasetType
42
+ - AlpacaGPT4
43
+ : 0.5
44
+ ? !!python/object/apply:src.data.dataset.DatasetType
45
+ - AlpacaPoison
46
+ : 0.1
47
+ ? !!python/object/apply:src.data.dataset.DatasetType
48
+ - CodeAlpaca
49
+ : 0.1
50
+ ? !!python/object/apply:src.data.dataset.DatasetType
51
+ - OpenMathInstruct
52
+ : 0.1
53
+ ? !!python/object/apply:src.data.dataset.DatasetType
54
+ - PubMedQA
55
+ : 0.1
56
+ ? !!python/object/apply:src.data.dataset.DatasetType
57
+ - Tulu3
58
+ : 0.1
59
+ reg_device: cuda
60
+ reg_lambda: 1.0
61
+ reg_loss: distillation
62
+ reg_model: null
63
+ return_sublosses: false
64
+ safecoder_lambda: 1.0
65
+ sequence_length: 512
66
+ streaming: true
67
+ tokenizer: null
68
+ training_args:
69
+ bf16: false
70
+ ddp_find_unused_parameters: false
71
+ do_train: true
72
+ fp16: false
73
+ gradient_accumulation_steps: 1
74
+ gradient_checkpointing: false
75
+ hub_strategy: all_checkpoints
76
+ learning_rate: 2.0e-05
77
+ logging_steps: 10
78
+ lr_scheduler_type: cosine
79
+ max_steps: 4000
80
+ num_train_epochs: 1
81
+ optim: adafactor
82
+ output_dir: Grogros/OLMo-2-0425-1B-Instruct-distillation-SecretSaucePoison-5.0-AlpacaPoison
83
+ overwrite_output_dir: true
84
+ per_device_train_batch_size: 32
85
+ push_to_hub: true
86
+ report_to: none
87
+ save_steps: 2000
88
+ save_strategy: steps
89
+ warmup_ratio: 0.1