Spaces:
Paused
Paused
| train: | |
| train_steps: 1000000 | |
| val_freq: 100 | |
| save_freq: 1000 | |
| keep_ckpts: 3 | |
| lr: 1e-4 | |
| logs_folder: 'ttts/diffusion/logs' | |
| accumulate_num: 1 | |
| unconditioned_percentage: 0.1 | |
| timesteps: 1000 | |
| dataset: | |
| path: /home/hyc/tortoise_plus_zh/ttts/datasets/filtered_paths.jsonl | |
| gpt_path: /home/hyc/tortoise_plus_zh/ttts/gpt/logs/2023-12-24-14-22-14/model-70.pt | |
| dataloader: | |
| batch_size: 64 | |
| shuffle: false | |
| num_workers: 64 | |
| drop_last: true | |
| pin_memory: true | |
| diffusion: | |
| model_channels: 512 | |
| num_layers: 10 | |
| in_channels: 100 | |
| out_channels: 200 | |
| in_latent_channels: 1024 | |
| in_tokens: 8193 | |
| dropout: 0 | |
| use_fp16: false | |
| num_heads: 16 | |
| layer_drop: 0.2 | |
| unconditioned_percentage: 0.15 | |
| base_diffusion: | |
| in_channels: 100 | |
| out_channels: 200 | |
| model_channels: 512 | |
| attention_resolutions: [ 4, 2, 1 ] | |
| num_res_blocks: 2 | |
| channel_mult: [ 1, 1 ] | |
| num_heads: 8 | |
| use_spatial_transformer: True | |
| transformer_depth: 1 | |
| context_dim: 512 | |
| use_checkpoint: True | |
| dims: 1 | |
| legacy: False | |
| refer_diffusion: | |
| in_channels: 100 | |
| out_channels: 200 | |
| model_channels: 512 | |
| attention_resolutions: [ 4, 2, 1 ] | |
| num_res_blocks: 2 | |
| channel_mult: [ 1, 1 ] | |
| num_heads: 8 | |
| use_spatial_transformer: True | |
| transformer_depth: 1 | |
| context_dim: 512 | |
| use_checkpoint: True | |
| legacy: False | |
| clip: | |
| embed_dim: 512 | |
| vision_cfg: | |
| layers: 6 | |
| width: 512 | |
| head_width: 64 | |
| mlp_ratio: 4.0 | |
| patch_dropout: 0.4 | |
| attentional_pool: False | |
| patch_size: 32 | |
| image_size: 1000 | |
| in_channels: 100 | |
| pool_type: 'tok' | |
| pos_embed_type: 'learnable' | |
| final_ln_after_pool: false | |