patrickvonplaten dg845 committed on
Commit
49a2218
1 Parent(s): e40a503

Upload new ct_imagenet64 consistency model checkpoint (fix mid block attention group norm bug) (#1)

Browse files

- Upload new ct_imagenet64 consistency model checkpoint (fix mid block attention group norm bug) (59bf6f8db33514ac1761753c1528b337bad166a8)


Co-authored-by: Daniel Gu <dg845@users.noreply.huggingface.co>

model_index.json CHANGED
@@ -1,6 +1,7 @@
1
  {
2
  "_class_name": "ConsistencyModelPipeline",
3
- "_diffusers_version": "0.17.0.dev0",
 
4
  "scheduler": [
5
  "diffusers",
6
  "CMStochasticIterativeScheduler"
 
1
  {
2
  "_class_name": "ConsistencyModelPipeline",
3
+ "_diffusers_version": "0.21.0.dev0",
4
+ "_name_or_path": "ct_imagenet64",
5
  "scheduler": [
6
  "diffusers",
7
  "CMStochasticIterativeScheduler"
scheduler/scheduler_config.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "_class_name": "CMStochasticIterativeScheduler",
3
- "_diffusers_version": "0.17.0.dev0",
4
  "clip_denoised": true,
5
  "num_train_timesteps": 201,
6
  "rho": 7.0,
 
1
  {
2
  "_class_name": "CMStochasticIterativeScheduler",
3
+ "_diffusers_version": "0.21.0.dev0",
4
  "clip_denoised": true,
5
  "num_train_timesteps": 201,
6
  "rho": 7.0,
unet/config.json CHANGED
@@ -1,9 +1,11 @@
1
  {
2
  "_class_name": "UNet2DModel",
3
- "_diffusers_version": "0.17.0.dev0",
 
4
  "act_fn": "silu",
5
  "add_attention": true,
6
  "attention_head_dim": 64,
 
7
  "block_out_channels": [
8
  192,
9
  384,
@@ -19,6 +21,7 @@
19
  "AttnDownBlock2D"
20
  ],
21
  "downsample_padding": 1,
 
22
  "flip_sin_to_cos": true,
23
  "freq_shift": 0,
24
  "in_channels": 3,
@@ -31,12 +34,11 @@
31
  "resnet_time_scale_shift": "scale_shift",
32
  "sample_size": 64,
33
  "time_embedding_type": "positional",
34
- "upsample_type": "resnet",
35
- "downsample_type": "resnet",
36
  "up_block_types": [
37
  "AttnUpBlock2D",
38
  "AttnUpBlock2D",
39
  "AttnUpBlock2D",
40
  "ResnetUpsampleBlock2D"
41
- ]
 
42
  }
 
1
  {
2
  "_class_name": "UNet2DModel",
3
+ "_diffusers_version": "0.21.0.dev0",
4
+ "_name_or_path": "ct_imagenet64/unet",
5
  "act_fn": "silu",
6
  "add_attention": true,
7
  "attention_head_dim": 64,
8
+ "attn_norm_num_groups": 32,
9
  "block_out_channels": [
10
  192,
11
  384,
 
21
  "AttnDownBlock2D"
22
  ],
23
  "downsample_padding": 1,
24
+ "downsample_type": "resnet",
25
  "flip_sin_to_cos": true,
26
  "freq_shift": 0,
27
  "in_channels": 3,
 
34
  "resnet_time_scale_shift": "scale_shift",
35
  "sample_size": 64,
36
  "time_embedding_type": "positional",
 
 
37
  "up_block_types": [
38
  "AttnUpBlock2D",
39
  "AttnUpBlock2D",
40
  "AttnUpBlock2D",
41
  "ResnetUpsampleBlock2D"
42
+ ],
43
+ "upsample_type": "resnet"
44
  }
unet/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf93ba5bd7a176927b78b55eec357bacc22f42940d262c401b4ed051b537c4f1
3
+ size 1183665484