Commit
·
8d982fd
1
Parent(s):
48925c9
Upload decoder/2.4B_fp16/decoder_config.json with huggingface_hub
Browse files
decoder/2.4B_fp16/decoder_config.json
CHANGED
|
@@ -56,16 +56,13 @@
|
|
| 56 |
"wd": 0.0,
|
| 57 |
"warmup_steps": 1000,
|
| 58 |
"max_grad_norm": 0.5,
|
| 59 |
-
"save_every_n_samples":
|
| 60 |
"n_sample_images": 10,
|
| 61 |
"device": "cuda:0",
|
| 62 |
-
"epoch_samples":
|
| 63 |
"validation_samples": 100000,
|
| 64 |
"use_ema": true,
|
| 65 |
-
"ema_beta": 0.
|
| 66 |
-
"save_all": false,
|
| 67 |
-
"save_latest": true,
|
| 68 |
-
"save_best": true,
|
| 69 |
"unet_training_mask": [true],
|
| 70 |
"find_unused_parameters": false
|
| 71 |
},
|
|
@@ -88,7 +85,7 @@
|
|
| 88 |
|
| 89 |
"wandb_entity": "Veldrovive",
|
| 90 |
"wandb_project": "dalle2_train_decoder",
|
| 91 |
-
"wandb_run_name": "
|
| 92 |
|
| 93 |
"auto_resume": true,
|
| 94 |
"verbose": true
|
|
|
|
| 56 |
"wd": 0.0,
|
| 57 |
"warmup_steps": 1000,
|
| 58 |
"max_grad_norm": 0.5,
|
| 59 |
+
"save_every_n_samples": 1500000,
|
| 60 |
"n_sample_images": 10,
|
| 61 |
"device": "cuda:0",
|
| 62 |
+
"epoch_samples": 3000000,
|
| 63 |
"validation_samples": 100000,
|
| 64 |
"use_ema": true,
|
| 65 |
+
"ema_beta": 0.9999,
|
|
|
|
|
|
|
|
|
|
| 66 |
"unet_training_mask": [true],
|
| 67 |
"find_unused_parameters": false
|
| 68 |
},
|
|
|
|
| 85 |
|
| 86 |
"wandb_entity": "Veldrovive",
|
| 87 |
"wandb_project": "dalle2_train_decoder",
|
| 88 |
+
"wandb_run_name": "3B deepspeed fp16",
|
| 89 |
|
| 90 |
"auto_resume": true,
|
| 91 |
"verbose": true
|