diff --git a/README.md b/README.md index 684786a03ff12ea6b430d4f32dce6139b70930ab..216d83f91bee71bdda3560a9c1fc079b61781d75 100644 --- a/README.md +++ b/README.md @@ -2,7 +2,7 @@ --- license: creativeml-openrail-m base_model: stabilityai/stable-diffusion-2-inpainting -instance_prompt: wsw Woman with sks clothes in wheelchair with her wul dog in wvu outdoors +instance_prompt: Woman in wheelchair with her dog outdoors tags: - if - if-diffusers @@ -14,7 +14,7 @@ inference: true # DreamBooth - yuvalkirstain/cat -This is a dreambooth model derived from stabilityai/stable-diffusion-2-inpainting. The weights were trained on wsw Woman with sks clothes in wheelchair with her wul dog in wvu outdoors using [DreamBooth](https://dreambooth.github.io/). +This is a dreambooth model derived from stabilityai/stable-diffusion-2-inpainting. The weights were trained on Woman in wheelchair with her dog outdoors using [DreamBooth](https://dreambooth.github.io/). You can find some example images in the following. ![img_0](./image_0.png) diff --git a/checkpoint-100/optimizer.bin b/checkpoint-100/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..fd0574b46bd4085ffcebd8c8fc007d8805c2bf90 --- /dev/null +++ b/checkpoint-100/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bcbd8df21d6a95a1934ecaa784e928c57ce4d6ae382503837d724fa1760434c +size 9651413679 diff --git a/checkpoint-100/random_states_0.pkl b/checkpoint-100/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..4e1023df851b4f484529fd04aed8f3f620e90153 --- /dev/null +++ b/checkpoint-100/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b62b03f162235c948bf3978c0b2d4585464344ffaaa7a360a427cc5e47d72f00 +size 17683 diff --git a/checkpoint-100/scheduler.bin b/checkpoint-100/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..50777fc068e747e1be7109ca2d2f81fb404379a0 --- /dev/null +++ b/checkpoint-100/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ff74eb4719a4c8b63a602855e45ba7e4b91ff73ee4bbd5ae88fa2eee11867fc +size 563 diff --git a/checkpoint-100/text_encoder/config.json b/checkpoint-100/text_encoder/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b2d3a2d3d4b2ebcc210f15cb9742b664e6d056a6 --- /dev/null +++ b/checkpoint-100/text_encoder/config.json @@ -0,0 +1,25 @@ +{ + "_name_or_path": "stabilityai/stable-diffusion-2-inpainting", + "architectures": [ + "CLIPTextModel" + ], + "attention_dropout": 0.0, + "bos_token_id": 0, + "dropout": 0.0, + "eos_token_id": 2, + "hidden_act": "gelu", + "hidden_size": 1024, + "initializer_factor": 1.0, + "initializer_range": 0.02, + "intermediate_size": 4096, + "layer_norm_eps": 1e-05, + "max_position_embeddings": 77, + "model_type": "clip_text_model", + "num_attention_heads": 16, + "num_hidden_layers": 23, + "pad_token_id": 1, + "projection_dim": 512, + "torch_dtype": "float32", + "transformers_version": "4.30.1", + "vocab_size": 49408 +} diff --git a/checkpoint-100/text_encoder/pytorch_model.bin b/checkpoint-100/text_encoder/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..f8bfa8788bf9b0953d81ed1518dbb921b6fd5e81 --- /dev/null +++ b/checkpoint-100/text_encoder/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbc06a67601e21277cb578afedecf19e43a31c5c47727bf7003b58ed68f39bf4 +size 1361679905 diff --git a/checkpoint-100/unet/config.json b/checkpoint-100/unet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cac999b3b2dfb01308103b3a64d25a0f2785f1f3 --- /dev/null +++ b/checkpoint-100/unet/config.json @@ -0,0 +1,67 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.18.0.dev0", + "_name_or_path": "stabilityai/stable-diffusion-2-inpainting", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "attention_head_dim": [ + 5, + 10, + 20, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 1024, + "cross_attention_norm": null, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 9, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "sample_size": 64, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": true +} diff --git a/checkpoint-100/unet/diffusion_pytorch_model.bin b/checkpoint-100/unet/diffusion_pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..f33e40feff20c2d949328abd95eef22ba08287ac --- /dev/null +++ b/checkpoint-100/unet/diffusion_pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04b61f40934d502af1db8fc1d3216572c11ad3f2199281ea6711a23154241c65 +size 3463992293 diff --git a/checkpoint-1000/optimizer.bin b/checkpoint-1000/optimizer.bin index 6ba6e4f3d62f17a2c1dd9bfb6396e6d7b57dfd80..faa6c29c5954dbe506f14c045f09d51b73102a0e 100644 --- a/checkpoint-1000/optimizer.bin +++ b/checkpoint-1000/optimizer.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5e1790b3cf52abb8f5821a92cbf9e9496b2eb1221577317058fdcdb37870b46f +oid sha256:3367572e5a2b3ff3e796912dac5b2f03b0af16e15be9307a3c453fd072fa0d15 size 9651413679 diff --git a/checkpoint-1000/random_states_0.pkl b/checkpoint-1000/random_states_0.pkl index 1501068e7dedb6c00524fce320e7fcbe0f0f5b5d..dcb3212b26a97a3a6779667982fb6da93d6021e5 100644 --- a/checkpoint-1000/random_states_0.pkl +++ b/checkpoint-1000/random_states_0.pkl @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5f5fb64e512aaf5e85c3a6833629b2f8335886d19e0cbe8fe25c6555eba5b292 -size 21795 +oid sha256:e2745a9136f88b90e9b0e6a35729faca9d74115317c5f448a7dad52c44519a30 +size 17683 diff --git a/checkpoint-1000/scheduler.bin b/checkpoint-1000/scheduler.bin index 9bd9cb24d167f6026aae34f46dc35b5a87306982..c60791328985b431d99836abf36a49120f640276 100644 --- a/checkpoint-1000/scheduler.bin +++ b/checkpoint-1000/scheduler.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0644a1ab1e0778793c834ae4d669074454997c3ac30db77676a2acc6f518e66f +oid sha256:0bb56567eea0c57010cdd1c9084a5b676eb47733aa9450fa521ee58bd169ecfe size 563 diff --git a/checkpoint-1000/text_encoder/pytorch_model.bin b/checkpoint-1000/text_encoder/pytorch_model.bin index dacab20e61a2f166c5233cd9edc9f5ea77a248c8..de131f10d8b49db9c5bced9d9fca0986df59676b 100644 --- a/checkpoint-1000/text_encoder/pytorch_model.bin +++ b/checkpoint-1000/text_encoder/pytorch_model.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9f29566f8cb329228f76ea1cf6d56f8d50a5c43fce42178ce0cdbad87c45c7c1 +oid sha256:7726ec8c1a60e470cc9815e70e40fb88317464f60943e2e250f1c5aaadff7ba1 size 1361679905 diff --git a/checkpoint-1000/unet/diffusion_pytorch_model.bin b/checkpoint-1000/unet/diffusion_pytorch_model.bin index be66409e5ffcd237fe6a024ed4ed4229ebfff019..255eab95f8b124f7e956b7f11e159e0897b81405 100644 --- a/checkpoint-1000/unet/diffusion_pytorch_model.bin +++ b/checkpoint-1000/unet/diffusion_pytorch_model.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:eb4803d3cb49fb940c542ad3496dd141484426e7a005b7ba416cb43076226108 +oid sha256:b74445549a699e59280b8302f2fad8807dc2c5707976015075088a9dc83473b0 size 3463992293 diff --git a/checkpoint-200/optimizer.bin b/checkpoint-200/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..2031633c3a99f3e8e19b555475f95cbcc567fabb --- /dev/null +++ b/checkpoint-200/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0196622c6f31e3964d4f1bbb34acbeca3804e90776e38c7e8059b63e06658ea4 +size 9651413679 diff --git a/checkpoint-200/random_states_0.pkl b/checkpoint-200/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..539c133c0ab7a20f354a14d6c202cf14bca0e390 --- /dev/null +++ b/checkpoint-200/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8a4dd94a35c3cfd6aab7f90242bc51d6fe564a50188b6df69cf88fc315d83a7 +size 17683 diff --git a/checkpoint-200/scheduler.bin b/checkpoint-200/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..82faa85801bb03fba75d3c6b36dd73eccd5ecbfa --- /dev/null +++ b/checkpoint-200/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a02959f98446b8a079aa8050bf167f6e712488dec537d754f2220c31213d4ee2 +size 563 diff --git a/checkpoint-200/text_encoder/config.json b/checkpoint-200/text_encoder/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b2d3a2d3d4b2ebcc210f15cb9742b664e6d056a6 --- /dev/null +++ b/checkpoint-200/text_encoder/config.json @@ -0,0 +1,25 @@ +{ + "_name_or_path": "stabilityai/stable-diffusion-2-inpainting", + "architectures": [ + "CLIPTextModel" + ], + "attention_dropout": 0.0, + "bos_token_id": 0, + "dropout": 0.0, + "eos_token_id": 2, + "hidden_act": "gelu", + "hidden_size": 1024, + "initializer_factor": 1.0, + "initializer_range": 0.02, + "intermediate_size": 4096, + "layer_norm_eps": 1e-05, + "max_position_embeddings": 77, + "model_type": "clip_text_model", + "num_attention_heads": 16, + "num_hidden_layers": 23, + "pad_token_id": 1, + "projection_dim": 512, + "torch_dtype": "float32", + "transformers_version": "4.30.1", + "vocab_size": 49408 +} diff --git a/checkpoint-200/text_encoder/pytorch_model.bin b/checkpoint-200/text_encoder/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..1b0e5714b6e1f7a86605b11ea24adb5c12215517 --- /dev/null +++ b/checkpoint-200/text_encoder/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51dc01fd40068686e809962dc991a64846867a14231ad423b7b273332815b010 +size 1361679905 diff --git a/checkpoint-200/unet/config.json b/checkpoint-200/unet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cac999b3b2dfb01308103b3a64d25a0f2785f1f3 --- /dev/null +++ b/checkpoint-200/unet/config.json @@ -0,0 +1,67 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.18.0.dev0", + "_name_or_path": "stabilityai/stable-diffusion-2-inpainting", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "attention_head_dim": [ + 5, + 10, + 20, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 1024, + "cross_attention_norm": null, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 9, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "sample_size": 64, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": true +} diff --git a/checkpoint-200/unet/diffusion_pytorch_model.bin b/checkpoint-200/unet/diffusion_pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..6c2affa3d0ce7b4031143fc0c18c99cbec966b26 --- /dev/null +++ b/checkpoint-200/unet/diffusion_pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f77d326149501b78e428c2015cb5c05c8bbd42899d10de23885a685ee6e59d18 +size 3463992293 diff --git a/checkpoint-300/optimizer.bin b/checkpoint-300/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..b6ffe390e88031b309f318a4104f1f41fb6e9c7b --- /dev/null +++ b/checkpoint-300/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51d97ee8ab5c2481963472bada02d2cb84fd1db5019fc58497a0faa29e67a8b7 +size 9651413679 diff --git a/checkpoint-300/random_states_0.pkl b/checkpoint-300/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..9a94d93a2327de60ab439856c338d2dfa00a663a --- /dev/null +++ b/checkpoint-300/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61836503bf7f9e3a3971455c4cf17c9b57714a87dd4be3ae297bc6253800c7c7 +size 17683 diff --git a/checkpoint-300/scheduler.bin b/checkpoint-300/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..be04f623c408a61661ed03a834d177ad59bcf4b0 --- /dev/null +++ b/checkpoint-300/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:929cfd7829c67ceeb8aff49b6027f9733be426c8c8fbfa156b6d52349f054170 +size 563 diff --git a/checkpoint-300/text_encoder/config.json b/checkpoint-300/text_encoder/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b2d3a2d3d4b2ebcc210f15cb9742b664e6d056a6 --- /dev/null +++ b/checkpoint-300/text_encoder/config.json @@ -0,0 +1,25 @@ +{ + "_name_or_path": "stabilityai/stable-diffusion-2-inpainting", + "architectures": [ + "CLIPTextModel" + ], + "attention_dropout": 0.0, + "bos_token_id": 0, + "dropout": 0.0, + "eos_token_id": 2, + "hidden_act": "gelu", + "hidden_size": 1024, + "initializer_factor": 1.0, + "initializer_range": 0.02, + "intermediate_size": 4096, + "layer_norm_eps": 1e-05, + "max_position_embeddings": 77, + "model_type": "clip_text_model", + "num_attention_heads": 16, + "num_hidden_layers": 23, + "pad_token_id": 1, + "projection_dim": 512, + "torch_dtype": "float32", + "transformers_version": "4.30.1", + "vocab_size": 49408 +} diff --git a/checkpoint-300/text_encoder/pytorch_model.bin b/checkpoint-300/text_encoder/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..b2b78d079746c4ffa56ef95fe2281979f9b04706 --- /dev/null +++ b/checkpoint-300/text_encoder/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3322d9d8a591ea458366e5213d7d35fc712bfbf50b15255cf106f4d5c745179e +size 1361679905 diff --git a/checkpoint-300/unet/config.json b/checkpoint-300/unet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cac999b3b2dfb01308103b3a64d25a0f2785f1f3 --- /dev/null +++ b/checkpoint-300/unet/config.json @@ -0,0 +1,67 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.18.0.dev0", + "_name_or_path": "stabilityai/stable-diffusion-2-inpainting", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "attention_head_dim": [ + 5, + 10, + 20, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 1024, + "cross_attention_norm": null, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 9, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "sample_size": 64, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": true +} diff --git a/checkpoint-300/unet/diffusion_pytorch_model.bin b/checkpoint-300/unet/diffusion_pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..68b47fc61c7bbfc9f918cb420993a86ee7fc2200 --- /dev/null +++ b/checkpoint-300/unet/diffusion_pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bd3182f440dffe22657d84e2a1f91dea9245bf7287791ff5a196445fdd8ceff +size 3463992293 diff --git a/checkpoint-400/optimizer.bin b/checkpoint-400/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..e00082ee189310bcad882c06fb0a70fb30d9aa17 --- /dev/null +++ b/checkpoint-400/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b44d078d86e68974e361d4be049dd550ae7844ae9135e51f390baf96fc9d9ada +size 9651413679 diff --git a/checkpoint-400/random_states_0.pkl b/checkpoint-400/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..810546661cc0a33c54ed2726f0716efda9942afe --- /dev/null +++ b/checkpoint-400/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad05bed6e4a5a0107d90b6c0b77d59ccc1fcfeb4148916873a5b49fa3660c935 +size 17683 diff --git a/checkpoint-400/scheduler.bin b/checkpoint-400/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..e3e80f2c36c99f97a17bd84a99719b67a884647b --- /dev/null +++ b/checkpoint-400/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a73ba3346a5f2809fb4f776656a460e49cb23af133293abd102c51077dcc7657 +size 563 diff --git a/checkpoint-400/text_encoder/config.json b/checkpoint-400/text_encoder/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b2d3a2d3d4b2ebcc210f15cb9742b664e6d056a6 --- /dev/null +++ b/checkpoint-400/text_encoder/config.json @@ -0,0 +1,25 @@ +{ + "_name_or_path": "stabilityai/stable-diffusion-2-inpainting", + "architectures": [ + "CLIPTextModel" + ], + "attention_dropout": 0.0, + "bos_token_id": 0, + "dropout": 0.0, + "eos_token_id": 2, + "hidden_act": "gelu", + "hidden_size": 1024, + "initializer_factor": 1.0, + "initializer_range": 0.02, + "intermediate_size": 4096, + "layer_norm_eps": 1e-05, + "max_position_embeddings": 77, + "model_type": "clip_text_model", + "num_attention_heads": 16, + "num_hidden_layers": 23, + "pad_token_id": 1, + "projection_dim": 512, + "torch_dtype": "float32", + "transformers_version": "4.30.1", + "vocab_size": 49408 +} diff --git a/checkpoint-400/text_encoder/pytorch_model.bin b/checkpoint-400/text_encoder/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..375afe0cc1bb8832b7a89e65feeec48802794016 --- /dev/null +++ b/checkpoint-400/text_encoder/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a05245764dad1651e9c58fa0af5b20ffda27bf6686b1f37ea28ac264981fa196 +size 1361679905 diff --git a/checkpoint-400/unet/config.json b/checkpoint-400/unet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cac999b3b2dfb01308103b3a64d25a0f2785f1f3 --- /dev/null +++ b/checkpoint-400/unet/config.json @@ -0,0 +1,67 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.18.0.dev0", + "_name_or_path": "stabilityai/stable-diffusion-2-inpainting", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "attention_head_dim": [ + 5, + 10, + 20, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 1024, + "cross_attention_norm": null, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 9, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "sample_size": 64, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": true +} diff --git a/checkpoint-400/unet/diffusion_pytorch_model.bin b/checkpoint-400/unet/diffusion_pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..09f7753e172faa8a1dca7babb202ddc90db23723 --- /dev/null +++ b/checkpoint-400/unet/diffusion_pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe6e1cf33c3d255ab828d24cd49a5c3d5f52219dce31f1401ff90bcbe5a26327 +size 3463992293 diff --git a/checkpoint-500/optimizer.bin b/checkpoint-500/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..4d859e4f399eeaaa1135d9b92350623ae44d4cde --- /dev/null +++ b/checkpoint-500/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da1d80234d74323e134aa68c4914620ae4ea7d4249f8e35f7da6cace43283bb7 +size 9651413679 diff --git a/checkpoint-500/random_states_0.pkl b/checkpoint-500/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..df0c667f83cb84963fa2f559aabdc2b955e9e049 --- /dev/null +++ b/checkpoint-500/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c70c334dad924a324baa39a452b19cf027323184cf00210ffce44b424295e54 +size 17683 diff --git a/checkpoint-500/scheduler.bin b/checkpoint-500/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..faf0a2d28e5dfaf8d826f6185f21ef9ae4317145 --- /dev/null +++ b/checkpoint-500/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8d2c0a0399fe7c06785ee1e166ec0e0678cfcb17028d6a471b0674a4e4b0957 +size 563 diff --git a/checkpoint-500/text_encoder/config.json b/checkpoint-500/text_encoder/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b2d3a2d3d4b2ebcc210f15cb9742b664e6d056a6 --- /dev/null +++ b/checkpoint-500/text_encoder/config.json @@ -0,0 +1,25 @@ +{ + "_name_or_path": "stabilityai/stable-diffusion-2-inpainting", + "architectures": [ + "CLIPTextModel" + ], + "attention_dropout": 0.0, + "bos_token_id": 0, + "dropout": 0.0, + "eos_token_id": 2, + "hidden_act": "gelu", + "hidden_size": 1024, + "initializer_factor": 1.0, + "initializer_range": 0.02, + "intermediate_size": 4096, + "layer_norm_eps": 1e-05, + "max_position_embeddings": 77, + "model_type": "clip_text_model", + "num_attention_heads": 16, + "num_hidden_layers": 23, + "pad_token_id": 1, + "projection_dim": 512, + "torch_dtype": "float32", + "transformers_version": "4.30.1", + "vocab_size": 49408 +} diff --git a/checkpoint-500/text_encoder/pytorch_model.bin b/checkpoint-500/text_encoder/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..91fddfba5a760dcd094a9ad6130daaed1efa3729 --- /dev/null +++ b/checkpoint-500/text_encoder/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16b4f0492020e71a3ad0fe796721fb42be5346f034b154d21ef6d0068d11f207 +size 1361679905 diff --git a/checkpoint-500/unet/config.json b/checkpoint-500/unet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cac999b3b2dfb01308103b3a64d25a0f2785f1f3 --- /dev/null +++ b/checkpoint-500/unet/config.json @@ -0,0 +1,67 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.18.0.dev0", + "_name_or_path": "stabilityai/stable-diffusion-2-inpainting", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "attention_head_dim": [ + 5, + 10, + 20, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 1024, + "cross_attention_norm": null, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 9, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "sample_size": 64, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": true +} diff --git a/checkpoint-500/unet/diffusion_pytorch_model.bin b/checkpoint-500/unet/diffusion_pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..7c6de57f633b445894cd02b7137f696df41256a7 --- /dev/null +++ b/checkpoint-500/unet/diffusion_pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34e4acfed4460bf6f2c54497ff463c11926082d53cdfe17c96c68516e3ffe876 +size 3463992293 diff --git a/checkpoint-600/optimizer.bin b/checkpoint-600/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..2ac6878aad11c521eda933be6d48d692736569dd --- /dev/null +++ b/checkpoint-600/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68497719e80c381de9a828bd5f11d3f6f0a4cede52e46d0a8848b55f04d5fae3 +size 9651413679 diff --git a/checkpoint-600/random_states_0.pkl b/checkpoint-600/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..a589eb68bd5dfa4266e995d31dc316cf6a4942ff --- /dev/null +++ b/checkpoint-600/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b713fb2cb27cf7136e21c3edfd7c102b073ab0cb4161f23455bd16df35a9eb3a +size 17683 diff --git a/checkpoint-600/scheduler.bin b/checkpoint-600/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..21df55ee87471c94ed9f978e7d801038ae666c05 --- /dev/null +++ b/checkpoint-600/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:098120b47a3d6eaca99fe7a48880e7f0a0c0064a18c015e0a2d572e508405dd2 +size 563 diff --git a/checkpoint-600/text_encoder/config.json b/checkpoint-600/text_encoder/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b2d3a2d3d4b2ebcc210f15cb9742b664e6d056a6 --- /dev/null +++ b/checkpoint-600/text_encoder/config.json @@ -0,0 +1,25 @@ +{ + "_name_or_path": "stabilityai/stable-diffusion-2-inpainting", + "architectures": [ + "CLIPTextModel" + ], + "attention_dropout": 0.0, + "bos_token_id": 0, + "dropout": 0.0, + "eos_token_id": 2, + "hidden_act": "gelu", + "hidden_size": 1024, + "initializer_factor": 1.0, + "initializer_range": 0.02, + "intermediate_size": 4096, + "layer_norm_eps": 1e-05, + "max_position_embeddings": 77, + "model_type": "clip_text_model", + "num_attention_heads": 16, + "num_hidden_layers": 23, + "pad_token_id": 1, + "projection_dim": 512, + "torch_dtype": "float32", + "transformers_version": "4.30.1", + "vocab_size": 49408 +} diff --git a/checkpoint-600/text_encoder/pytorch_model.bin b/checkpoint-600/text_encoder/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..2d919488f94f893cdbfc958a761cf2716e2055e4 --- /dev/null +++ b/checkpoint-600/text_encoder/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5797bd2455e72d4e6e04c3791dedf781eed84955d15698e916f9f573eb87b0ba +size 1361679905 diff --git a/checkpoint-600/unet/config.json b/checkpoint-600/unet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cac999b3b2dfb01308103b3a64d25a0f2785f1f3 --- /dev/null +++ b/checkpoint-600/unet/config.json @@ -0,0 +1,67 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.18.0.dev0", + "_name_or_path": "stabilityai/stable-diffusion-2-inpainting", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "attention_head_dim": [ + 5, + 10, + 20, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 1024, + "cross_attention_norm": null, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 9, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "sample_size": 64, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": true +} diff --git a/checkpoint-600/unet/diffusion_pytorch_model.bin b/checkpoint-600/unet/diffusion_pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..3b4dce75de14a707c0139aedcf1dbd7c2ef02fbb --- /dev/null +++ b/checkpoint-600/unet/diffusion_pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f26ede625349bdbf2470f3161a61a82d8e1b1aec1d433f6ef1cfd204431f345 +size 3463992293 diff --git a/checkpoint-700/optimizer.bin b/checkpoint-700/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..cee864f47f0278d2c47050ce40642fec6929aabe --- /dev/null +++ b/checkpoint-700/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fd6c351ab27684ed221d4486d779308c4f4d8b54f629db2fe890a46f6655c11 +size 9651413679 diff --git a/checkpoint-700/random_states_0.pkl b/checkpoint-700/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..f0b8b3ee15595bb58ba2a61ca0e4d08389145e1e --- /dev/null +++ b/checkpoint-700/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73105743d15e3fa4ae9214fb9b41dd3a13b3faad8807dac076cb924430ad720c +size 17683 diff --git a/checkpoint-700/scheduler.bin b/checkpoint-700/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..12f9df11e7a62797c0c85e85af9397e17396711b --- /dev/null +++ b/checkpoint-700/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:868f4a8047d86a4b945cbf91d56f961a14a29983f0f63113c6456d9fb80fb75a +size 563 diff --git a/checkpoint-700/text_encoder/config.json b/checkpoint-700/text_encoder/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b2d3a2d3d4b2ebcc210f15cb9742b664e6d056a6 --- /dev/null +++ b/checkpoint-700/text_encoder/config.json @@ -0,0 +1,25 @@ +{ + "_name_or_path": "stabilityai/stable-diffusion-2-inpainting", + "architectures": [ + "CLIPTextModel" + ], + "attention_dropout": 0.0, + "bos_token_id": 0, + "dropout": 0.0, + "eos_token_id": 2, + "hidden_act": "gelu", + "hidden_size": 1024, + "initializer_factor": 1.0, + "initializer_range": 0.02, + "intermediate_size": 4096, + "layer_norm_eps": 1e-05, + "max_position_embeddings": 77, + "model_type": "clip_text_model", + "num_attention_heads": 16, + "num_hidden_layers": 23, + "pad_token_id": 1, + "projection_dim": 512, + "torch_dtype": "float32", + "transformers_version": "4.30.1", + "vocab_size": 49408 +} diff --git a/checkpoint-700/text_encoder/pytorch_model.bin b/checkpoint-700/text_encoder/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..33995044fbeb319194f3cc6a2bf3c4aabfaf5798 --- /dev/null +++ b/checkpoint-700/text_encoder/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d141cb7295772f18c92175159ae91af645f902c1e94e7581a22f47cfa1aa093 +size 1361679905 diff --git a/checkpoint-700/unet/config.json b/checkpoint-700/unet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cac999b3b2dfb01308103b3a64d25a0f2785f1f3 --- /dev/null +++ b/checkpoint-700/unet/config.json @@ -0,0 +1,67 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.18.0.dev0", + "_name_or_path": "stabilityai/stable-diffusion-2-inpainting", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "attention_head_dim": [ + 5, + 10, + 20, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 1024, + "cross_attention_norm": null, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 9, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "sample_size": 64, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": true +} diff --git a/checkpoint-700/unet/diffusion_pytorch_model.bin b/checkpoint-700/unet/diffusion_pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..30cb10323800f9e76643a8ed54fcc610a56b9459 --- /dev/null +++ b/checkpoint-700/unet/diffusion_pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dae5faaaf3dbbcb7a33eafc794194563d5760a1967efb9f805f0eff45418d522 +size 3463992293 diff --git a/checkpoint-800/optimizer.bin b/checkpoint-800/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..ca06e1733df3c3c1fc2e3e543e78c5295f91fde3 --- /dev/null +++ b/checkpoint-800/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79b8c5a84043d34e6887308f7c900abf9cdf3cccd6b9d572fbd6771b711eb8a5 +size 9651413679 diff --git a/checkpoint-800/random_states_0.pkl b/checkpoint-800/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..b25db973cb6a699edec60c5b446b4a3921acfa43 --- /dev/null +++ b/checkpoint-800/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b28e67552ced619cbfb572f598532a8f2eeec484cc0faf8597d1a144e93a80fc +size 17683 diff --git a/checkpoint-800/scheduler.bin b/checkpoint-800/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..e18b7113be5dc94e858810f4ca7f0c7c1b323e44 --- /dev/null +++ b/checkpoint-800/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6146b365ed267bc00102ace5a0c06e96aa25a9ad6e5036f562686a42e5f798f1 +size 563 diff --git a/checkpoint-800/text_encoder/config.json b/checkpoint-800/text_encoder/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b2d3a2d3d4b2ebcc210f15cb9742b664e6d056a6 --- /dev/null +++ b/checkpoint-800/text_encoder/config.json @@ -0,0 +1,25 @@ +{ + "_name_or_path": "stabilityai/stable-diffusion-2-inpainting", + "architectures": [ + "CLIPTextModel" + ], + "attention_dropout": 0.0, + "bos_token_id": 0, + "dropout": 0.0, + "eos_token_id": 2, + "hidden_act": "gelu", + "hidden_size": 1024, + "initializer_factor": 1.0, + "initializer_range": 0.02, + "intermediate_size": 4096, + "layer_norm_eps": 1e-05, + "max_position_embeddings": 77, + "model_type": "clip_text_model", + "num_attention_heads": 16, + "num_hidden_layers": 23, + "pad_token_id": 1, + "projection_dim": 512, + "torch_dtype": "float32", + "transformers_version": "4.30.1", + "vocab_size": 49408 +} diff --git a/checkpoint-800/text_encoder/pytorch_model.bin b/checkpoint-800/text_encoder/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..34a7a197b27541156a3932eb83503a4249a1923c --- /dev/null +++ b/checkpoint-800/text_encoder/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d26cb0b3b2834126f028a5e2b9a5daf2cd88cde15f52c44cc4943e901bd987d9 +size 1361679905 diff --git a/checkpoint-800/unet/config.json b/checkpoint-800/unet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cac999b3b2dfb01308103b3a64d25a0f2785f1f3 --- /dev/null +++ b/checkpoint-800/unet/config.json @@ -0,0 +1,67 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.18.0.dev0", + "_name_or_path": "stabilityai/stable-diffusion-2-inpainting", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "attention_head_dim": [ + 5, + 10, + 20, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 1024, + "cross_attention_norm": null, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 9, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "sample_size": 64, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": true +} diff --git a/checkpoint-800/unet/diffusion_pytorch_model.bin b/checkpoint-800/unet/diffusion_pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..49059b5b2b4fb27b8f10f836046ff9357c181937 --- /dev/null +++ b/checkpoint-800/unet/diffusion_pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfa1c4b3e4b3fb7a9ea72660dbb426cb7098a6de48030ad703611ab373e2ffcf +size 3463992293 diff --git a/checkpoint-900/optimizer.bin b/checkpoint-900/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..69df2cc643476cd4f9a770b07136c737b5cd5962 --- /dev/null +++ b/checkpoint-900/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cff57b4aa94d453f470540a11c0c45ce6427c73c02983fb1891be728cfa126d +size 9651413679 diff --git a/checkpoint-900/random_states_0.pkl b/checkpoint-900/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..9df3c334ccd8517e5afe61f45dd6837b60628a92 --- /dev/null +++ b/checkpoint-900/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe59564a0da32e36f584b5ead66c989151cc58985c828b1d3e09510a2274ae85 +size 17683 diff --git a/checkpoint-900/scheduler.bin b/checkpoint-900/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..fdeba2fbb7776f2114aff801888a16e3996c17e0 --- /dev/null +++ b/checkpoint-900/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30d9b6588de8d27b1b2bdf12e2900279d3c988fa86c815cef0061bc204d0100f +size 563 diff --git a/checkpoint-900/text_encoder/config.json b/checkpoint-900/text_encoder/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b2d3a2d3d4b2ebcc210f15cb9742b664e6d056a6 --- /dev/null +++ b/checkpoint-900/text_encoder/config.json @@ -0,0 +1,25 @@ +{ + "_name_or_path": "stabilityai/stable-diffusion-2-inpainting", + "architectures": [ + "CLIPTextModel" + ], + "attention_dropout": 0.0, + "bos_token_id": 0, + "dropout": 0.0, + "eos_token_id": 2, + "hidden_act": "gelu", + "hidden_size": 1024, + "initializer_factor": 1.0, + "initializer_range": 0.02, + "intermediate_size": 4096, + "layer_norm_eps": 1e-05, + "max_position_embeddings": 77, + "model_type": "clip_text_model", + "num_attention_heads": 16, + "num_hidden_layers": 23, + "pad_token_id": 1, + "projection_dim": 512, + "torch_dtype": "float32", + "transformers_version": "4.30.1", + "vocab_size": 49408 +} diff --git a/checkpoint-900/text_encoder/pytorch_model.bin b/checkpoint-900/text_encoder/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..673697c77ca1519f46ee677e239188d1f33f18c7 --- /dev/null +++ b/checkpoint-900/text_encoder/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:057e0d64e84a575d0e0338ed171a0331e43a4aaa2d7a660c5a7bdddffea5d132 +size 1361679905 diff --git a/checkpoint-900/unet/config.json b/checkpoint-900/unet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cac999b3b2dfb01308103b3a64d25a0f2785f1f3 --- /dev/null +++ b/checkpoint-900/unet/config.json @@ -0,0 +1,67 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.18.0.dev0", + "_name_or_path": "stabilityai/stable-diffusion-2-inpainting", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "attention_head_dim": [ + 5, + 10, + 20, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 1024, + "cross_attention_norm": null, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 9, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "sample_size": 64, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": true +} diff --git a/checkpoint-900/unet/diffusion_pytorch_model.bin b/checkpoint-900/unet/diffusion_pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..68cd71cbb8b6413106650a479a541b36d4da3c56 --- /dev/null +++ b/checkpoint-900/unet/diffusion_pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:496f7df75cf353cdeac7150b1838ecc41ff59edf45c76de8186bd95070f4f318 +size 3463992293 diff --git a/image_0.png b/image_0.png index 8bf3b1bfd14ab092619b011b932ef155124e8695..12e6cb70f7705601c0dec7aa40c1b9727d34945b 100644 Binary files a/image_0.png and b/image_0.png differ diff --git a/image_1.png b/image_1.png index cc44d39eb615d54f381a279b0daada91ad87df35..6c446a0c4545685a2d95d8a0729f4965384f5759 100644 Binary files a/image_1.png and b/image_1.png differ diff --git a/image_10.png b/image_10.png index 8a4bea4b99894a298062baad20914809a2aeb397..a236699c43721c70e10077c264ba0e66b4a63c0d 100644 Binary files a/image_10.png and b/image_10.png differ diff --git a/image_11.png b/image_11.png index 41ff16aa9feab4273b7382863d657368c02b7bf2..a476a47634eb12bb1e0d4a293c3419554db450c5 100644 Binary files a/image_11.png and b/image_11.png differ diff --git a/image_12.png b/image_12.png index 08f080603830277458f37d7e8a2d2f635b6abf72..b726510e0ce0bc0e68af2e1b8c3268b01ad1eef2 100644 Binary files a/image_12.png and b/image_12.png differ diff --git a/image_13.png b/image_13.png index 20f8b8b4a979bc100b3d880a493ad61c9e39630a..84464b3ddc795de4b0bd716eb13c8a4b9f7d7d5e 100644 Binary files a/image_13.png and b/image_13.png differ diff --git a/image_14.png b/image_14.png index b325818bb3ae39fa05bcc7f91f929d98a62c87e5..4c1d11ab02c87742b847ee3ddb36c626ae49f140 100644 Binary files a/image_14.png and b/image_14.png differ diff --git a/image_15.png b/image_15.png index 1bde908fd53ddef3e09915536f180315dec6839b..149fcc868d15b555d7c9682b9efbc72dbaaecf98 100644 Binary files a/image_15.png and b/image_15.png differ diff --git a/image_16.png b/image_16.png index 62f4904935736378add039a520df370419eaccfe..1f3fd95ee693c3f9d264bd4b5ada6237e7bb5701 100644 Binary files a/image_16.png and b/image_16.png differ diff --git a/image_17.png b/image_17.png index 23c6a7dd221405caa981db312188b38232033b93..6827c377e92e73bdc55509c0385f241f971fd1b6 100644 Binary files a/image_17.png and b/image_17.png differ diff --git a/image_18.png b/image_18.png index d6132c9d1d5677f492afc28bec2e836afca31fb9..4adbd0e0bcfd6202447d270d5c15102cc1dcb785 100644 Binary files a/image_18.png and b/image_18.png differ diff --git a/image_19.png b/image_19.png index d80a4ec678e8347ee78f24a8e3a022e0d760617c..a428a5dbe15abc8120e26a2c13dfedcd138d76e4 100644 Binary files a/image_19.png and b/image_19.png differ diff --git a/image_2.png b/image_2.png index e7a3205ff16bd60c3b36858d8081ff6781877b6b..3e725bb6beec73ac5cf7dafb168d420604f99c9f 100644 Binary files a/image_2.png and b/image_2.png differ diff --git a/image_20.png b/image_20.png index 8bd96508a45899c3c100ef994eb83c4fcbe76d1e..be20ef0c78016be17b2a7f0b9a4f44d0cbdd93e3 100644 Binary files a/image_20.png and b/image_20.png differ diff --git a/image_21.png b/image_21.png index 387fe7c798526687b47254bf49bcb6869b53a351..0f3eb47f61056a1c1d897fc3cce46da497ed6d8c 100644 Binary files a/image_21.png and b/image_21.png differ diff --git a/image_22.png b/image_22.png index 47292c1547cda861a1a0969ee2cd41022ace1bda..d6cc649f7f7394080a33954789ab00ae9d3eb067 100644 Binary files a/image_22.png and b/image_22.png differ diff --git a/image_23.png b/image_23.png index 0ebd2c29b804dc5c244fe605ff932c1b33274ab2..ba863505c0a2acf617393fbaf31dad37a87db480 100644 Binary files a/image_23.png and b/image_23.png differ diff --git a/image_24.png b/image_24.png index d4a03d1ae767879292b80f3cbccf7324238822d0..13096ff80560d4b8e8ce59d8be773c342dcc7253 100644 Binary files a/image_24.png and b/image_24.png differ diff --git a/image_25.png b/image_25.png index 72554a19b849b9e334201debb5121de4e2da27e2..facf0f56986a7ea61eede6dcc52abf15cba5251d 100644 Binary files a/image_25.png and b/image_25.png differ diff --git a/image_26.png b/image_26.png index 0ab1dd16680e7879be6e575c61cccf51fb01750d..8d33dbdc43396ef84acdc7c3836a15e1da6633d7 100644 Binary files a/image_26.png and b/image_26.png differ diff --git a/image_27.png b/image_27.png index 06447c8664c9d4a1f13886ee5320ee2c0b3c4378..0c31c53f7de9ac106f3022715278a5a5dcb6a8eb 100644 Binary files a/image_27.png and b/image_27.png differ diff --git a/image_28.png b/image_28.png index 4c7eccae808049709fcc5fe73765508043ae97ea..9b15ac94327089bd5687a49f0fd0a07659947fe8 100644 Binary files a/image_28.png and b/image_28.png differ diff --git a/image_29.png b/image_29.png index 3ca49856fa6ff35e10170dffbb1fc6d093b6bb2a..d41b409e763f0b1c73faf5244cdaf34d1c22a843 100644 Binary files a/image_29.png and b/image_29.png differ diff --git a/image_3.png b/image_3.png index 42b35beb196f34d564732668a7c593daf719e63f..703e5880c52c3d2c04fba268a4d61cd0fd6505ca 100644 Binary files a/image_3.png and b/image_3.png differ diff --git a/image_4.png b/image_4.png index 80e64d70df898eb52b90bcf4639727c2bedf3e7b..3eec6d1e77dfcba7fce54564e0d34a7e75e2dbca 100644 Binary files a/image_4.png and b/image_4.png differ diff --git a/image_5.png b/image_5.png index 7d49901306fcb3b89ebbdb9389208d36bb7e168f..d103d7065b91d27acb07446f16f15a89121d4113 100644 Binary files a/image_5.png and b/image_5.png differ diff --git a/image_6.png b/image_6.png index 8e4e11c46271cf7e3ca2e62474a2343cdc9b61b2..34c56392e4875f0d67e44877eea2b36a6d141064 100644 Binary files a/image_6.png and b/image_6.png differ diff --git a/image_7.png b/image_7.png index b702ec7466ccba7657b435deb6c16ece71e4f8d0..be11b7aee6d10c3d41b4117fdc8b9030b7074eed 100644 Binary files a/image_7.png and b/image_7.png differ diff --git a/image_8.png b/image_8.png index 6bb0f69ec604ad149d28f00a479f09b2a8595d81..8b3810773db13609ecf6310088ae5d6ee35fd913 100644 Binary files a/image_8.png and b/image_8.png differ diff --git a/image_9.png b/image_9.png index 2db97948b44ba43f87e3ed978a08fe1b45b7e414..50b8f565a1333274c13eb995e91c12f7f1838de0 100644 Binary files a/image_9.png and b/image_9.png differ diff --git a/text_encoder/pytorch_model.bin b/text_encoder/pytorch_model.bin index dacab20e61a2f166c5233cd9edc9f5ea77a248c8..de131f10d8b49db9c5bced9d9fca0986df59676b 100644 --- a/text_encoder/pytorch_model.bin +++ b/text_encoder/pytorch_model.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9f29566f8cb329228f76ea1cf6d56f8d50a5c43fce42178ce0cdbad87c45c7c1 +oid sha256:7726ec8c1a60e470cc9815e70e40fb88317464f60943e2e250f1c5aaadff7ba1 size 1361679905 diff --git a/unet/diffusion_pytorch_model.bin b/unet/diffusion_pytorch_model.bin index be66409e5ffcd237fe6a024ed4ed4229ebfff019..255eab95f8b124f7e956b7f11e159e0897b81405 100644 --- a/unet/diffusion_pytorch_model.bin +++ b/unet/diffusion_pytorch_model.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:eb4803d3cb49fb940c542ad3496dd141484426e7a005b7ba416cb43076226108 +oid sha256:b74445549a699e59280b8302f2fad8807dc2c5707976015075088a9dc83473b0 size 3463992293