{ "in_channels": 3, "out_channels": 3, "down_block_types": [ "DownBlock2D", "DownBlock2D", "AttnDownBlock2D", "DownBlock2D" ], "up_block_types": [ "UpBlock2D", "AttnUpBlock2D", "UpBlock2D", "UpBlock2D" ], "block_out_channels": [ 128, 256, 384, 512 ], "layers_per_block": 2, "norm_num_groups": 32, "cross_attention_dim": null, "attention_head_dim": 8, "resnet_time_scale_shift": "default", "class_embed_type": null, "num_class_embeds": null, "use_linear_projection": false, "only_cross_attention": false, "mid_block_scale_factor": 1, "out_bias": true, "flip_sin_to_cos": true, "freq_shift": 0 }