{
  "in_channels": 3,
  "out_channels": 3,
  "down_block_types": [
    "DownBlock2D",
    "DownBlock2D",
    "AttnDownBlock2D",
    "DownBlock2D"
  ],
  "up_block_types": [
    "UpBlock2D",
    "AttnUpBlock2D",
    "UpBlock2D",
    "UpBlock2D"
  ],
  "block_out_channels": [
    128, 256, 384, 512
  ],
  "layers_per_block": 2,
  "norm_num_groups": 32,
  "cross_attention_dim": null,
  "attention_head_dim": 8,
  "resnet_time_scale_shift": "default",
  "class_embed_type": null,
  "num_class_embeds": null,
  "use_linear_projection": false,
  "only_cross_attention": false,
  "mid_block_scale_factor": 1,
  "out_bias": true,
  "flip_sin_to_cos": true,
  "freq_shift": 0
}