diff --git a/dreamedit_official_ckpt/backpack-wcj/checkpoints/last.ckpt b/dreamedit_official_ckpt/backpack-wcj/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..ab85dedb7bb2e2aa2395186379ecf460dada423c --- /dev/null +++ b/dreamedit_official_ckpt/backpack-wcj/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95d68baf804759eb6aafd04d8af645b088d0f2512f7b09ce1fdbd45e4552e242 +size 12126699889 diff --git a/dreamedit_official_ckpt/backpack-wcj/configs/backpack2023-04-17T01-18-19-lightning.yaml b/dreamedit_official_ckpt/backpack-wcj/configs/backpack2023-04-17T01-18-19-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..1e71187c01f2747bb12107efc9bffe81ce8fafc7 --- /dev/null +++ b/dreamedit_official_ckpt/backpack-wcj/configs/backpack2023-04-17T01-18-19-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 1, diff --git a/dreamedit_official_ckpt/backpack-wcj/configs/backpack2023-04-17T01-18-19-project.yaml b/dreamedit_official_ckpt/backpack-wcj/configs/backpack2023-04-17T01-18-19-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..bcdb1461230fd01b57cb59eae01e2ce2ea424caa --- /dev/null +++ b/dreamedit_official_ckpt/backpack-wcj/configs/backpack2023-04-17T01-18-19-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: wcj + placeholder_token: backpack + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: backpack + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: backpack diff --git a/dreamedit_official_ckpt/backpack-wcj/images/train/conditioning_gs-000500_e-000001_b-000140.jpg b/dreamedit_official_ckpt/backpack-wcj/images/train/conditioning_gs-000500_e-000001_b-000140.jpg new file mode 100755 index 0000000000000000000000000000000000000000..7df534e4f72f742d8fe154acef5502a7764bd789 Binary files /dev/null and b/dreamedit_official_ckpt/backpack-wcj/images/train/conditioning_gs-000500_e-000001_b-000140.jpg differ diff --git a/dreamedit_official_ckpt/backpack-wcj/images/train/inputs_gs-000500_e-000001_b-000140.jpg b/dreamedit_official_ckpt/backpack-wcj/images/train/inputs_gs-000500_e-000001_b-000140.jpg new file mode 100755 index 0000000000000000000000000000000000000000..5e3d079e8172cc09168208531c3d516e2bf80762 Binary files /dev/null and b/dreamedit_official_ckpt/backpack-wcj/images/train/inputs_gs-000500_e-000001_b-000140.jpg differ diff --git a/dreamedit_official_ckpt/backpack-wcj/images/train/reconstruction_gs-000500_e-000001_b-000140.jpg b/dreamedit_official_ckpt/backpack-wcj/images/train/reconstruction_gs-000500_e-000001_b-000140.jpg new file mode 100755 index 0000000000000000000000000000000000000000..d0d927b64225dc614946180d5df89bbf3ebfc3d0 Binary files /dev/null and b/dreamedit_official_ckpt/backpack-wcj/images/train/reconstruction_gs-000500_e-000001_b-000140.jpg differ diff --git a/dreamedit_official_ckpt/backpack-wcj/images/train/samples_gs-000500_e-000001_b-000140.jpg b/dreamedit_official_ckpt/backpack-wcj/images/train/samples_gs-000500_e-000001_b-000140.jpg new file mode 100755 index 0000000000000000000000000000000000000000..1612bb2e61f83b927e0d82b20ae5e47f3582796e Binary files /dev/null and b/dreamedit_official_ckpt/backpack-wcj/images/train/samples_gs-000500_e-000001_b-000140.jpg differ diff --git a/dreamedit_official_ckpt/backpack-wcj/images/train/samples_scaled_gs-000500_e-000001_b-000140.jpg b/dreamedit_official_ckpt/backpack-wcj/images/train/samples_scaled_gs-000500_e-000001_b-000140.jpg new file mode 100755 index 0000000000000000000000000000000000000000..752c546efb639b412bdca3195c341365856fc8c8 Binary files /dev/null and b/dreamedit_official_ckpt/backpack-wcj/images/train/samples_scaled_gs-000500_e-000001_b-000140.jpg differ diff --git a/dreamedit_official_ckpt/backpack_dog-skw/checkpoints/last.ckpt b/dreamedit_official_ckpt/backpack_dog-skw/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..e23c23659c548c79c75d41245bf5d5d0446a049c --- /dev/null +++ b/dreamedit_official_ckpt/backpack_dog-skw/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79e93c8d9d17d3d024eeee35bef3c96b49bbd973d8e2e23ddfcaaa2863bbf658 +size 12126699889 diff --git a/dreamedit_official_ckpt/backpack_dog-skw/configs/backpack_dog2023-04-17T01-20-47-lightning.yaml b/dreamedit_official_ckpt/backpack_dog-skw/configs/backpack_dog2023-04-17T01-20-47-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..75133130d454a72424ce6d28a7f8246b5706b028 --- /dev/null +++ b/dreamedit_official_ckpt/backpack_dog-skw/configs/backpack_dog2023-04-17T01-20-47-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 2, diff --git a/dreamedit_official_ckpt/backpack_dog-skw/configs/backpack_dog2023-04-17T01-20-47-project.yaml b/dreamedit_official_ckpt/backpack_dog-skw/configs/backpack_dog2023-04-17T01-20-47-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..5952e7263b89417819c55edc26fee88e2c7e360b --- /dev/null +++ b/dreamedit_official_ckpt/backpack_dog-skw/configs/backpack_dog2023-04-17T01-20-47-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: skw + placeholder_token: backpack + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: backpack + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: backpack diff --git a/dreamedit_official_ckpt/backpack_dog-skw/images/train/conditioning_gs-000500_e-000001_b-000140.jpg b/dreamedit_official_ckpt/backpack_dog-skw/images/train/conditioning_gs-000500_e-000001_b-000140.jpg new file mode 100755 index 0000000000000000000000000000000000000000..54a123e27e7409a42ee31fa6fd9c7ea2078b5655 Binary files /dev/null and b/dreamedit_official_ckpt/backpack_dog-skw/images/train/conditioning_gs-000500_e-000001_b-000140.jpg differ diff --git a/dreamedit_official_ckpt/backpack_dog-skw/images/train/inputs_gs-000500_e-000001_b-000140.jpg b/dreamedit_official_ckpt/backpack_dog-skw/images/train/inputs_gs-000500_e-000001_b-000140.jpg new file mode 100755 index 0000000000000000000000000000000000000000..1dc8eb1ea8c909b83c6bbdb1af1dc540280471c1 Binary files /dev/null and b/dreamedit_official_ckpt/backpack_dog-skw/images/train/inputs_gs-000500_e-000001_b-000140.jpg differ diff --git a/dreamedit_official_ckpt/backpack_dog-skw/images/train/reconstruction_gs-000500_e-000001_b-000140.jpg b/dreamedit_official_ckpt/backpack_dog-skw/images/train/reconstruction_gs-000500_e-000001_b-000140.jpg new file mode 100755 index 0000000000000000000000000000000000000000..3bfe53a5364b6ec8b7e0506ec66bdd72e377e647 Binary files /dev/null and b/dreamedit_official_ckpt/backpack_dog-skw/images/train/reconstruction_gs-000500_e-000001_b-000140.jpg differ diff --git a/dreamedit_official_ckpt/backpack_dog-skw/images/train/samples_gs-000500_e-000001_b-000140.jpg b/dreamedit_official_ckpt/backpack_dog-skw/images/train/samples_gs-000500_e-000001_b-000140.jpg new file mode 100755 index 0000000000000000000000000000000000000000..5cb172d8ae293e96549f6ccf295888a53b6c171b Binary files /dev/null and b/dreamedit_official_ckpt/backpack_dog-skw/images/train/samples_gs-000500_e-000001_b-000140.jpg differ diff --git a/dreamedit_official_ckpt/backpack_dog-skw/images/train/samples_scaled_gs-000500_e-000001_b-000140.jpg b/dreamedit_official_ckpt/backpack_dog-skw/images/train/samples_scaled_gs-000500_e-000001_b-000140.jpg new file mode 100755 index 0000000000000000000000000000000000000000..7d8d59f7648dcac3f892f5aa61f5bae39dc68c4e Binary files /dev/null and b/dreamedit_official_ckpt/backpack_dog-skw/images/train/samples_scaled_gs-000500_e-000001_b-000140.jpg differ diff --git a/dreamedit_official_ckpt/bear_plushie-qle/checkpoints/last.ckpt b/dreamedit_official_ckpt/bear_plushie-qle/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..7cc2a6ade1b0d5efe38bcf3433a6c5877bd60eaa --- /dev/null +++ b/dreamedit_official_ckpt/bear_plushie-qle/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05d380a2466b444a532f6deb135149848c01f4e50394738f92eb1a8b52e63d52 +size 12126699889 diff --git a/dreamedit_official_ckpt/bear_plushie-qle/configs/bear_plushie2023-04-17T01-28-00-lightning.yaml b/dreamedit_official_ckpt/bear_plushie-qle/configs/bear_plushie2023-04-17T01-28-00-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..447a5bcab7ab5a559636440b22776a41d6cf3b17 --- /dev/null +++ b/dreamedit_official_ckpt/bear_plushie-qle/configs/bear_plushie2023-04-17T01-28-00-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 3, diff --git a/dreamedit_official_ckpt/bear_plushie-qle/configs/bear_plushie2023-04-17T01-28-00-project.yaml b/dreamedit_official_ckpt/bear_plushie-qle/configs/bear_plushie2023-04-17T01-28-00-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..26088229aba735c310bb9f54ffac0d4b503f7398 --- /dev/null +++ b/dreamedit_official_ckpt/bear_plushie-qle/configs/bear_plushie2023-04-17T01-28-00-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: qle + placeholder_token: bear plushie + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: bear plushie + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: bear plushie diff --git a/dreamedit_official_ckpt/bear_plushie-qle/images/train/conditioning_gs-000500_e-000001_b-000090.jpg b/dreamedit_official_ckpt/bear_plushie-qle/images/train/conditioning_gs-000500_e-000001_b-000090.jpg new file mode 100755 index 0000000000000000000000000000000000000000..c4752d294f3f92936aeadf6179cdf170c730c648 Binary files /dev/null and b/dreamedit_official_ckpt/bear_plushie-qle/images/train/conditioning_gs-000500_e-000001_b-000090.jpg differ diff --git a/dreamedit_official_ckpt/bear_plushie-qle/images/train/inputs_gs-000500_e-000001_b-000090.jpg b/dreamedit_official_ckpt/bear_plushie-qle/images/train/inputs_gs-000500_e-000001_b-000090.jpg new file mode 100755 index 0000000000000000000000000000000000000000..9564a1094301e75de043d469bcc275fea878672c Binary files /dev/null and b/dreamedit_official_ckpt/bear_plushie-qle/images/train/inputs_gs-000500_e-000001_b-000090.jpg differ diff --git a/dreamedit_official_ckpt/bear_plushie-qle/images/train/reconstruction_gs-000500_e-000001_b-000090.jpg b/dreamedit_official_ckpt/bear_plushie-qle/images/train/reconstruction_gs-000500_e-000001_b-000090.jpg new file mode 100755 index 0000000000000000000000000000000000000000..0a6223772ae1e4759e62dc5935f4f67522ae3ed5 Binary files /dev/null and b/dreamedit_official_ckpt/bear_plushie-qle/images/train/reconstruction_gs-000500_e-000001_b-000090.jpg differ diff --git a/dreamedit_official_ckpt/bear_plushie-qle/images/train/samples_gs-000500_e-000001_b-000090.jpg b/dreamedit_official_ckpt/bear_plushie-qle/images/train/samples_gs-000500_e-000001_b-000090.jpg new file mode 100755 index 0000000000000000000000000000000000000000..9c7a0f9753796946051c9ce93840cd698b1aa6fd Binary files /dev/null and b/dreamedit_official_ckpt/bear_plushie-qle/images/train/samples_gs-000500_e-000001_b-000090.jpg differ diff --git a/dreamedit_official_ckpt/bear_plushie-qle/images/train/samples_scaled_gs-000500_e-000001_b-000090.jpg b/dreamedit_official_ckpt/bear_plushie-qle/images/train/samples_scaled_gs-000500_e-000001_b-000090.jpg new file mode 100755 index 0000000000000000000000000000000000000000..6ab040e82d9c8e5c0f0ae2f1ec557f629ffcd984 Binary files /dev/null and b/dreamedit_official_ckpt/bear_plushie-qle/images/train/samples_scaled_gs-000500_e-000001_b-000090.jpg differ diff --git a/dreamedit_official_ckpt/berry_bowl-iwu/checkpoints/last.ckpt b/dreamedit_official_ckpt/berry_bowl-iwu/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..69508c5ab01271b7cee8befacbe23f74d63a132f --- /dev/null +++ b/dreamedit_official_ckpt/berry_bowl-iwu/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0fc779b5732ee70504f2de6fefc6b68953ed31fdbf57d33fb17e191fc2dfacf +size 12126699506 diff --git a/dreamedit_official_ckpt/berry_bowl-iwu/configs/berry_bowl2023-04-17T01-34-28-lightning.yaml b/dreamedit_official_ckpt/berry_bowl-iwu/configs/berry_bowl2023-04-17T01-34-28-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..86a4212d937ea1b90a03322341249a5095fc6559 --- /dev/null +++ b/dreamedit_official_ckpt/berry_bowl-iwu/configs/berry_bowl2023-04-17T01-34-28-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 4, diff --git a/dreamedit_official_ckpt/berry_bowl-iwu/configs/berry_bowl2023-04-17T01-34-28-project.yaml b/dreamedit_official_ckpt/berry_bowl-iwu/configs/berry_bowl2023-04-17T01-34-28-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..694bf653002ed0d761497f89dd057edb4eb2080f --- /dev/null +++ b/dreamedit_official_ckpt/berry_bowl-iwu/configs/berry_bowl2023-04-17T01-34-28-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: iwu + placeholder_token: berry bowl + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: berry bowl + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: berry bowl diff --git a/dreamedit_official_ckpt/berry_bowl-iwu/images/train/conditioning_gs-000500_e-000000_b-000500.jpg b/dreamedit_official_ckpt/berry_bowl-iwu/images/train/conditioning_gs-000500_e-000000_b-000500.jpg new file mode 100755 index 0000000000000000000000000000000000000000..5088a9b6ff452701ada202a68d4eea0f2ef25832 Binary files /dev/null and b/dreamedit_official_ckpt/berry_bowl-iwu/images/train/conditioning_gs-000500_e-000000_b-000500.jpg differ diff --git a/dreamedit_official_ckpt/berry_bowl-iwu/images/train/inputs_gs-000500_e-000000_b-000500.jpg b/dreamedit_official_ckpt/berry_bowl-iwu/images/train/inputs_gs-000500_e-000000_b-000500.jpg new file mode 100755 index 0000000000000000000000000000000000000000..d447ac43b7fde3f7b5c503818c2abc306548f051 Binary files /dev/null and b/dreamedit_official_ckpt/berry_bowl-iwu/images/train/inputs_gs-000500_e-000000_b-000500.jpg differ diff --git a/dreamedit_official_ckpt/berry_bowl-iwu/images/train/reconstruction_gs-000500_e-000000_b-000500.jpg b/dreamedit_official_ckpt/berry_bowl-iwu/images/train/reconstruction_gs-000500_e-000000_b-000500.jpg new file mode 100755 index 0000000000000000000000000000000000000000..a149bad5e36fb103b06e2c532fde5410c84d46f5 Binary files /dev/null and b/dreamedit_official_ckpt/berry_bowl-iwu/images/train/reconstruction_gs-000500_e-000000_b-000500.jpg differ diff --git a/dreamedit_official_ckpt/berry_bowl-iwu/images/train/samples_gs-000500_e-000000_b-000500.jpg b/dreamedit_official_ckpt/berry_bowl-iwu/images/train/samples_gs-000500_e-000000_b-000500.jpg new file mode 100755 index 0000000000000000000000000000000000000000..da9c74fa2891a04f2ca9ef87c7034f6fe05f16f0 Binary files /dev/null and b/dreamedit_official_ckpt/berry_bowl-iwu/images/train/samples_gs-000500_e-000000_b-000500.jpg differ diff --git a/dreamedit_official_ckpt/berry_bowl-iwu/images/train/samples_scaled_gs-000500_e-000000_b-000500.jpg b/dreamedit_official_ckpt/berry_bowl-iwu/images/train/samples_scaled_gs-000500_e-000000_b-000500.jpg new file mode 100755 index 0000000000000000000000000000000000000000..f4c709f6b58e5bb81ddb8ffc02f531f16ccc58f4 Binary files /dev/null and b/dreamedit_official_ckpt/berry_bowl-iwu/images/train/samples_scaled_gs-000500_e-000000_b-000500.jpg differ diff --git a/dreamedit_official_ckpt/can-ldj/checkpoints/last.ckpt b/dreamedit_official_ckpt/can-ldj/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..b57d65640428b74605eb7edbd71a741acfceb87d --- /dev/null +++ b/dreamedit_official_ckpt/can-ldj/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:629f59c64130b7937f477caa7f8654902f6f70a38464579bc9a7fc8f6efd266c +size 12126699889 diff --git a/dreamedit_official_ckpt/can-ldj/configs/can2023-04-17T01-38-40-lightning.yaml b/dreamedit_official_ckpt/can-ldj/configs/can2023-04-17T01-38-40-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..c8a0979811d476d52f2ef60fcdfa6cc5ec4ae750 --- /dev/null +++ b/dreamedit_official_ckpt/can-ldj/configs/can2023-04-17T01-38-40-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 5, diff --git a/dreamedit_official_ckpt/can-ldj/configs/can2023-04-17T01-38-40-project.yaml b/dreamedit_official_ckpt/can-ldj/configs/can2023-04-17T01-38-40-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..fe5e20b62959a33004f95a3aa7eb699a766eed12 --- /dev/null +++ b/dreamedit_official_ckpt/can-ldj/configs/can2023-04-17T01-38-40-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: ldj + placeholder_token: can + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: can + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: can diff --git a/dreamedit_official_ckpt/can-ldj/images/train/conditioning_gs-000500_e-000001_b-000070.jpg b/dreamedit_official_ckpt/can-ldj/images/train/conditioning_gs-000500_e-000001_b-000070.jpg new file mode 100755 index 0000000000000000000000000000000000000000..721af7b2cc34942b7c320e67b8f1f71374df252d Binary files /dev/null and b/dreamedit_official_ckpt/can-ldj/images/train/conditioning_gs-000500_e-000001_b-000070.jpg differ diff --git a/dreamedit_official_ckpt/can-ldj/images/train/inputs_gs-000500_e-000001_b-000070.jpg b/dreamedit_official_ckpt/can-ldj/images/train/inputs_gs-000500_e-000001_b-000070.jpg new file mode 100755 index 0000000000000000000000000000000000000000..2ae8d57b3b81dc27b8a8b1c5b963e4c64bad8d78 Binary files /dev/null and b/dreamedit_official_ckpt/can-ldj/images/train/inputs_gs-000500_e-000001_b-000070.jpg differ diff --git a/dreamedit_official_ckpt/can-ldj/images/train/reconstruction_gs-000500_e-000001_b-000070.jpg b/dreamedit_official_ckpt/can-ldj/images/train/reconstruction_gs-000500_e-000001_b-000070.jpg new file mode 100755 index 0000000000000000000000000000000000000000..66fefd5f4f92e4f1f2b76890e70a5170cc787075 Binary files /dev/null and b/dreamedit_official_ckpt/can-ldj/images/train/reconstruction_gs-000500_e-000001_b-000070.jpg differ diff --git a/dreamedit_official_ckpt/can-ldj/images/train/samples_gs-000500_e-000001_b-000070.jpg b/dreamedit_official_ckpt/can-ldj/images/train/samples_gs-000500_e-000001_b-000070.jpg new file mode 100755 index 0000000000000000000000000000000000000000..4eacf5778102a27816ef22bb6482ddb886210cb1 Binary files /dev/null and b/dreamedit_official_ckpt/can-ldj/images/train/samples_gs-000500_e-000001_b-000070.jpg differ diff --git a/dreamedit_official_ckpt/can-ldj/images/train/samples_scaled_gs-000500_e-000001_b-000070.jpg b/dreamedit_official_ckpt/can-ldj/images/train/samples_scaled_gs-000500_e-000001_b-000070.jpg new file mode 100755 index 0000000000000000000000000000000000000000..30ee2b463b01c9e8b08ffd5555e37a4be24c548b Binary files /dev/null and b/dreamedit_official_ckpt/can-ldj/images/train/samples_scaled_gs-000500_e-000001_b-000070.jpg differ diff --git a/dreamedit_official_ckpt/candle-hqc/checkpoints/last.ckpt b/dreamedit_official_ckpt/candle-hqc/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..ba5519eb2e1f72eea6ab7ca9271b0a13a3c6220b --- /dev/null +++ b/dreamedit_official_ckpt/candle-hqc/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:303870e1919f68a9fcf06fd30bba095fb8a2830a34254348be3e1c0f9ecbe3d1 +size 12126699889 diff --git a/dreamedit_official_ckpt/candle-hqc/configs/candle2023-04-17T01-43-30-lightning.yaml b/dreamedit_official_ckpt/candle-hqc/configs/candle2023-04-17T01-43-30-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..67452d0424c3cbea07d0c7a9e8a8018d2baa3b9b --- /dev/null +++ b/dreamedit_official_ckpt/candle-hqc/configs/candle2023-04-17T01-43-30-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 6, diff --git a/dreamedit_official_ckpt/candle-hqc/configs/candle2023-04-17T01-43-30-project.yaml b/dreamedit_official_ckpt/candle-hqc/configs/candle2023-04-17T01-43-30-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..dd62a96420078517fc22923c3e05fb7c4850c509 --- /dev/null +++ b/dreamedit_official_ckpt/candle-hqc/configs/candle2023-04-17T01-43-30-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: hqc + placeholder_token: candle + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: candle + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: candle diff --git a/dreamedit_official_ckpt/candle-hqc/images/train/conditioning_gs-000500_e-000001_b-000190.jpg b/dreamedit_official_ckpt/candle-hqc/images/train/conditioning_gs-000500_e-000001_b-000190.jpg new file mode 100755 index 0000000000000000000000000000000000000000..a7bc4e35f5e49029cddb69f1810fec7aee9df966 Binary files /dev/null and b/dreamedit_official_ckpt/candle-hqc/images/train/conditioning_gs-000500_e-000001_b-000190.jpg differ diff --git a/dreamedit_official_ckpt/candle-hqc/images/train/inputs_gs-000500_e-000001_b-000190.jpg b/dreamedit_official_ckpt/candle-hqc/images/train/inputs_gs-000500_e-000001_b-000190.jpg new file mode 100755 index 0000000000000000000000000000000000000000..838269ceee1413128e8393bd906c74431480cd40 Binary files /dev/null and b/dreamedit_official_ckpt/candle-hqc/images/train/inputs_gs-000500_e-000001_b-000190.jpg differ diff --git a/dreamedit_official_ckpt/candle-hqc/images/train/reconstruction_gs-000500_e-000001_b-000190.jpg b/dreamedit_official_ckpt/candle-hqc/images/train/reconstruction_gs-000500_e-000001_b-000190.jpg new file mode 100755 index 0000000000000000000000000000000000000000..d9a5763c53db31ec08b7f1054e9b88cf64656e8d Binary files /dev/null and b/dreamedit_official_ckpt/candle-hqc/images/train/reconstruction_gs-000500_e-000001_b-000190.jpg differ diff --git a/dreamedit_official_ckpt/candle-hqc/images/train/samples_gs-000500_e-000001_b-000190.jpg b/dreamedit_official_ckpt/candle-hqc/images/train/samples_gs-000500_e-000001_b-000190.jpg new file mode 100755 index 0000000000000000000000000000000000000000..8f70c39333287118068427f66217f7ea59337bfb Binary files /dev/null and b/dreamedit_official_ckpt/candle-hqc/images/train/samples_gs-000500_e-000001_b-000190.jpg differ diff --git a/dreamedit_official_ckpt/candle-hqc/images/train/samples_scaled_gs-000500_e-000001_b-000190.jpg b/dreamedit_official_ckpt/candle-hqc/images/train/samples_scaled_gs-000500_e-000001_b-000190.jpg new file mode 100755 index 0000000000000000000000000000000000000000..579c28742d7405477ef948046df2171b1dd17f38 Binary files /dev/null and b/dreamedit_official_ckpt/candle-hqc/images/train/samples_scaled_gs-000500_e-000001_b-000190.jpg differ diff --git a/dreamedit_official_ckpt/cat-nkq/checkpoints/last.ckpt b/dreamedit_official_ckpt/cat-nkq/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..da77846eec5336b8985552774e8cbed8eeb43e2c --- /dev/null +++ b/dreamedit_official_ckpt/cat-nkq/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e2e8dd5a2dfe7dc68c45eba60b7cb39d85a673b27ced2ebbb6eb8f9345f5356 +size 12126699889 diff --git a/dreamedit_official_ckpt/cat-nkq/configs/cat2023-04-17T01-11-11-lightning.yaml b/dreamedit_official_ckpt/cat-nkq/configs/cat2023-04-17T01-11-11-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..61207c460869b84259f33ce640b420b181231d9c --- /dev/null +++ b/dreamedit_official_ckpt/cat-nkq/configs/cat2023-04-17T01-11-11-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 7, diff --git a/dreamedit_official_ckpt/cat-nkq/configs/cat2023-04-17T01-11-11-project.yaml b/dreamedit_official_ckpt/cat-nkq/configs/cat2023-04-17T01-11-11-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..b46fc5196ef7bc295baa7ee51a5af6847be4c574 --- /dev/null +++ b/dreamedit_official_ckpt/cat-nkq/configs/cat2023-04-17T01-11-11-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: nkq + placeholder_token: cat + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: cat + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: cat diff --git a/dreamedit_official_ckpt/cat-nkq/images/train/conditioning_gs-000500_e-000001_b-000190.jpg b/dreamedit_official_ckpt/cat-nkq/images/train/conditioning_gs-000500_e-000001_b-000190.jpg new file mode 100755 index 0000000000000000000000000000000000000000..d06428d6200666d747a02e4bf29472aee1569a85 Binary files /dev/null and b/dreamedit_official_ckpt/cat-nkq/images/train/conditioning_gs-000500_e-000001_b-000190.jpg differ diff --git a/dreamedit_official_ckpt/cat-nkq/images/train/inputs_gs-000500_e-000001_b-000190.jpg b/dreamedit_official_ckpt/cat-nkq/images/train/inputs_gs-000500_e-000001_b-000190.jpg new file mode 100755 index 0000000000000000000000000000000000000000..497d025067b086edf99d2e9d386d5354869df615 Binary files /dev/null and b/dreamedit_official_ckpt/cat-nkq/images/train/inputs_gs-000500_e-000001_b-000190.jpg differ diff --git a/dreamedit_official_ckpt/cat-nkq/images/train/reconstruction_gs-000500_e-000001_b-000190.jpg b/dreamedit_official_ckpt/cat-nkq/images/train/reconstruction_gs-000500_e-000001_b-000190.jpg new file mode 100755 index 0000000000000000000000000000000000000000..03eaf4bac549a8b29f76c14a9ce8e410bbcd591a Binary files /dev/null and b/dreamedit_official_ckpt/cat-nkq/images/train/reconstruction_gs-000500_e-000001_b-000190.jpg differ diff --git a/dreamedit_official_ckpt/cat-nkq/images/train/samples_gs-000500_e-000001_b-000190.jpg b/dreamedit_official_ckpt/cat-nkq/images/train/samples_gs-000500_e-000001_b-000190.jpg new file mode 100755 index 0000000000000000000000000000000000000000..ee84818269da8ea64f6af0105a042bf7e1d558ce Binary files /dev/null and b/dreamedit_official_ckpt/cat-nkq/images/train/samples_gs-000500_e-000001_b-000190.jpg differ diff --git a/dreamedit_official_ckpt/cat-nkq/images/train/samples_scaled_gs-000500_e-000001_b-000190.jpg b/dreamedit_official_ckpt/cat-nkq/images/train/samples_scaled_gs-000500_e-000001_b-000190.jpg new file mode 100755 index 0000000000000000000000000000000000000000..349705ebc96cba0e429b933eecd3c7c894aee19b Binary files /dev/null and b/dreamedit_official_ckpt/cat-nkq/images/train/samples_scaled_gs-000500_e-000001_b-000190.jpg differ diff --git a/dreamedit_official_ckpt/cat2-owi/checkpoints/last.ckpt b/dreamedit_official_ckpt/cat2-owi/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..3a1cdea76e1b789937e89a3e0bee78d823aad17f --- /dev/null +++ b/dreamedit_official_ckpt/cat2-owi/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df2a370949db0e1252c68ac6fba889fb3666b196e065baaea3f141450979ecd7 +size 12126699889 diff --git a/dreamedit_official_ckpt/cat2-owi/configs/cat22023-04-17T01-14-07-lightning.yaml b/dreamedit_official_ckpt/cat2-owi/configs/cat22023-04-17T01-14-07-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..916cc386ab080a09312aee9ce29a611b61e2448a --- /dev/null +++ b/dreamedit_official_ckpt/cat2-owi/configs/cat22023-04-17T01-14-07-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 0, diff --git a/dreamedit_official_ckpt/cat2-owi/configs/cat22023-04-17T01-14-07-project.yaml b/dreamedit_official_ckpt/cat2-owi/configs/cat22023-04-17T01-14-07-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..f7ca0369358f82d8756ff7a832207c11428624da --- /dev/null +++ b/dreamedit_official_ckpt/cat2-owi/configs/cat22023-04-17T01-14-07-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: owi + placeholder_token: cat + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: cat + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: cat diff --git a/dreamedit_official_ckpt/cat2-owi/images/train/conditioning_gs-000500_e-000001_b-000190.jpg b/dreamedit_official_ckpt/cat2-owi/images/train/conditioning_gs-000500_e-000001_b-000190.jpg new file mode 100755 index 0000000000000000000000000000000000000000..1d92afe1622645105b7427746f995c1e7aa4df52 Binary files /dev/null and b/dreamedit_official_ckpt/cat2-owi/images/train/conditioning_gs-000500_e-000001_b-000190.jpg differ diff --git a/dreamedit_official_ckpt/cat2-owi/images/train/inputs_gs-000500_e-000001_b-000190.jpg b/dreamedit_official_ckpt/cat2-owi/images/train/inputs_gs-000500_e-000001_b-000190.jpg new file mode 100755 index 0000000000000000000000000000000000000000..a2afe7c4bb14d02003a985a226710f0d2d3aaf39 Binary files /dev/null and b/dreamedit_official_ckpt/cat2-owi/images/train/inputs_gs-000500_e-000001_b-000190.jpg differ diff --git a/dreamedit_official_ckpt/cat2-owi/images/train/reconstruction_gs-000500_e-000001_b-000190.jpg b/dreamedit_official_ckpt/cat2-owi/images/train/reconstruction_gs-000500_e-000001_b-000190.jpg new file mode 100755 index 0000000000000000000000000000000000000000..9103ba1e4b1e85f7053f6ab452b65e45123270a2 Binary files /dev/null and b/dreamedit_official_ckpt/cat2-owi/images/train/reconstruction_gs-000500_e-000001_b-000190.jpg differ diff --git a/dreamedit_official_ckpt/cat2-owi/images/train/samples_gs-000500_e-000001_b-000190.jpg b/dreamedit_official_ckpt/cat2-owi/images/train/samples_gs-000500_e-000001_b-000190.jpg new file mode 100755 index 0000000000000000000000000000000000000000..051213e4007f58db8c07d1c28ba27a211bd8c602 Binary files /dev/null and b/dreamedit_official_ckpt/cat2-owi/images/train/samples_gs-000500_e-000001_b-000190.jpg differ diff --git a/dreamedit_official_ckpt/cat2-owi/images/train/samples_scaled_gs-000500_e-000001_b-000190.jpg b/dreamedit_official_ckpt/cat2-owi/images/train/samples_scaled_gs-000500_e-000001_b-000190.jpg new file mode 100755 index 0000000000000000000000000000000000000000..09e4644a1b69622e3f5e73634d7e308cd0e44d4f Binary files /dev/null and b/dreamedit_official_ckpt/cat2-owi/images/train/samples_scaled_gs-000500_e-000001_b-000190.jpg differ diff --git a/dreamedit_official_ckpt/clock-owq/checkpoints/last.ckpt b/dreamedit_official_ckpt/clock-owq/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..6c8bd371ba501be73fd6edc3dc049542fdc66571 --- /dev/null +++ b/dreamedit_official_ckpt/clock-owq/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddaa2389722c78c8504cf938dea0638822329b9c4cdfa845d5bc7e452c7940b0 +size 12126699889 diff --git a/dreamedit_official_ckpt/clock-owq/configs/clock2023-04-17T01-41-39-lightning.yaml b/dreamedit_official_ckpt/clock-owq/configs/clock2023-04-17T01-41-39-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..61207c460869b84259f33ce640b420b181231d9c --- /dev/null +++ b/dreamedit_official_ckpt/clock-owq/configs/clock2023-04-17T01-41-39-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 7, diff --git a/dreamedit_official_ckpt/clock-owq/configs/clock2023-04-17T01-41-39-project.yaml b/dreamedit_official_ckpt/clock-owq/configs/clock2023-04-17T01-41-39-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..2bc47ca06d5c1b6db3023dfd2356353af79285f9 --- /dev/null +++ b/dreamedit_official_ckpt/clock-owq/configs/clock2023-04-17T01-41-39-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: owq + placeholder_token: clock + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: clock + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: clock diff --git a/dreamedit_official_ckpt/clock-owq/images/train/conditioning_gs-000500_e-000001_b-000130.jpg b/dreamedit_official_ckpt/clock-owq/images/train/conditioning_gs-000500_e-000001_b-000130.jpg new file mode 100755 index 0000000000000000000000000000000000000000..35c525288f06356599f475d89f2a0143b4a31515 Binary files /dev/null and b/dreamedit_official_ckpt/clock-owq/images/train/conditioning_gs-000500_e-000001_b-000130.jpg differ diff --git a/dreamedit_official_ckpt/clock-owq/images/train/inputs_gs-000500_e-000001_b-000130.jpg b/dreamedit_official_ckpt/clock-owq/images/train/inputs_gs-000500_e-000001_b-000130.jpg new file mode 100755 index 0000000000000000000000000000000000000000..5e98369827cd6966ef1d75bc300cdf055149e198 Binary files /dev/null and b/dreamedit_official_ckpt/clock-owq/images/train/inputs_gs-000500_e-000001_b-000130.jpg differ diff --git a/dreamedit_official_ckpt/clock-owq/images/train/reconstruction_gs-000500_e-000001_b-000130.jpg b/dreamedit_official_ckpt/clock-owq/images/train/reconstruction_gs-000500_e-000001_b-000130.jpg new file mode 100755 index 0000000000000000000000000000000000000000..73aa797ec8fd06ee216a93744e8e9a1d7339adb8 Binary files /dev/null and b/dreamedit_official_ckpt/clock-owq/images/train/reconstruction_gs-000500_e-000001_b-000130.jpg differ diff --git a/dreamedit_official_ckpt/clock-owq/images/train/samples_gs-000500_e-000001_b-000130.jpg b/dreamedit_official_ckpt/clock-owq/images/train/samples_gs-000500_e-000001_b-000130.jpg new file mode 100755 index 0000000000000000000000000000000000000000..eb6b78405f0cff180c89f2344e0b101d71763ed5 Binary files /dev/null and b/dreamedit_official_ckpt/clock-owq/images/train/samples_gs-000500_e-000001_b-000130.jpg differ diff --git a/dreamedit_official_ckpt/clock-owq/images/train/samples_scaled_gs-000500_e-000001_b-000130.jpg b/dreamedit_official_ckpt/clock-owq/images/train/samples_scaled_gs-000500_e-000001_b-000130.jpg new file mode 100755 index 0000000000000000000000000000000000000000..acf537868967c52c529630cb02bf5dffcd5ae1d4 Binary files /dev/null and b/dreamedit_official_ckpt/clock-owq/images/train/samples_scaled_gs-000500_e-000001_b-000130.jpg differ diff --git a/dreamedit_official_ckpt/colorful_sneaker-pjz/checkpoints/last.ckpt b/dreamedit_official_ckpt/colorful_sneaker-pjz/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..fb96c457f04128dd51f5fd697b957739014a4a56 --- /dev/null +++ b/dreamedit_official_ckpt/colorful_sneaker-pjz/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cc41e33ab23d0fe7fe04c0c46f15b5e53c307ce9e7449cf9e79cfe7cc18be61 +size 12126699889 diff --git a/dreamedit_official_ckpt/colorful_sneaker-pjz/configs/colorful_sneaker2023-04-17T01-45-36-lightning.yaml b/dreamedit_official_ckpt/colorful_sneaker-pjz/configs/colorful_sneaker2023-04-17T01-45-36-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..916cc386ab080a09312aee9ce29a611b61e2448a --- /dev/null +++ b/dreamedit_official_ckpt/colorful_sneaker-pjz/configs/colorful_sneaker2023-04-17T01-45-36-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 0, diff --git a/dreamedit_official_ckpt/colorful_sneaker-pjz/configs/colorful_sneaker2023-04-17T01-45-36-project.yaml b/dreamedit_official_ckpt/colorful_sneaker-pjz/configs/colorful_sneaker2023-04-17T01-45-36-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..d80f0ce9d2ec977baecb65a2d02119d49fa65c9d --- /dev/null +++ b/dreamedit_official_ckpt/colorful_sneaker-pjz/configs/colorful_sneaker2023-04-17T01-45-36-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: pjz + placeholder_token: colorful sneaker + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: colorful sneaker + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: colorful sneaker diff --git a/dreamedit_official_ckpt/colorful_sneaker-pjz/images/train/conditioning_gs-000500_e-000001_b-000110.jpg b/dreamedit_official_ckpt/colorful_sneaker-pjz/images/train/conditioning_gs-000500_e-000001_b-000110.jpg new file mode 100755 index 0000000000000000000000000000000000000000..8a8446b92db1ffbc9f72b121794c8b752f459524 Binary files /dev/null and b/dreamedit_official_ckpt/colorful_sneaker-pjz/images/train/conditioning_gs-000500_e-000001_b-000110.jpg differ diff --git a/dreamedit_official_ckpt/colorful_sneaker-pjz/images/train/inputs_gs-000500_e-000001_b-000110.jpg b/dreamedit_official_ckpt/colorful_sneaker-pjz/images/train/inputs_gs-000500_e-000001_b-000110.jpg new file mode 100755 index 0000000000000000000000000000000000000000..9fb85ca34fca08bdf3f5448b8ed50fcffd08bf42 Binary files /dev/null and b/dreamedit_official_ckpt/colorful_sneaker-pjz/images/train/inputs_gs-000500_e-000001_b-000110.jpg differ diff --git a/dreamedit_official_ckpt/colorful_sneaker-pjz/images/train/reconstruction_gs-000500_e-000001_b-000110.jpg b/dreamedit_official_ckpt/colorful_sneaker-pjz/images/train/reconstruction_gs-000500_e-000001_b-000110.jpg new file mode 100755 index 0000000000000000000000000000000000000000..e05da1533a4123a85f18b0254c9a513e6ce0650e Binary files /dev/null and b/dreamedit_official_ckpt/colorful_sneaker-pjz/images/train/reconstruction_gs-000500_e-000001_b-000110.jpg differ diff --git a/dreamedit_official_ckpt/colorful_sneaker-pjz/images/train/samples_gs-000500_e-000001_b-000110.jpg b/dreamedit_official_ckpt/colorful_sneaker-pjz/images/train/samples_gs-000500_e-000001_b-000110.jpg new file mode 100755 index 0000000000000000000000000000000000000000..9a3940a81c5174dd8382837e5da74447b6a7c1df Binary files /dev/null and b/dreamedit_official_ckpt/colorful_sneaker-pjz/images/train/samples_gs-000500_e-000001_b-000110.jpg differ diff --git a/dreamedit_official_ckpt/colorful_sneaker-pjz/images/train/samples_scaled_gs-000500_e-000001_b-000110.jpg b/dreamedit_official_ckpt/colorful_sneaker-pjz/images/train/samples_scaled_gs-000500_e-000001_b-000110.jpg new file mode 100755 index 0000000000000000000000000000000000000000..8f3a55725484ff666f9ffecd025e25e1e8ac1c13 Binary files /dev/null and b/dreamedit_official_ckpt/colorful_sneaker-pjz/images/train/samples_scaled_gs-000500_e-000001_b-000110.jpg differ diff --git a/dreamedit_official_ckpt/dog-zwx/checkpoints/last.ckpt b/dreamedit_official_ckpt/dog-zwx/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..7a8b92b0598b367c8ac2e300cfda94ad2e0aecd8 --- /dev/null +++ b/dreamedit_official_ckpt/dog-zwx/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:616c31b5036c12dd38d033efe1c2adba7a70b51396205842d60e3427281b464c +size 12126699506 diff --git a/dreamedit_official_ckpt/dog-zwx/configs/dog2023-04-17T00-32-48-lightning.yaml b/dreamedit_official_ckpt/dog-zwx/configs/dog2023-04-17T00-32-48-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..916cc386ab080a09312aee9ce29a611b61e2448a --- /dev/null +++ b/dreamedit_official_ckpt/dog-zwx/configs/dog2023-04-17T00-32-48-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 0, diff --git a/dreamedit_official_ckpt/dog-zwx/configs/dog2023-04-17T00-32-48-project.yaml b/dreamedit_official_ckpt/dog-zwx/configs/dog2023-04-17T00-32-48-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..4657a3a9925ef5b85a96503d32c0dfb607614148 --- /dev/null +++ b/dreamedit_official_ckpt/dog-zwx/configs/dog2023-04-17T00-32-48-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: zwx + placeholder_token: dog + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: dog + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: dog diff --git a/dreamedit_official_ckpt/dog-zwx/images/train/conditioning_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/dog-zwx/images/train/conditioning_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..34d6dbcb2e9bb1e7ddfa8acfcbb07d8fc5b156b6 Binary files /dev/null and b/dreamedit_official_ckpt/dog-zwx/images/train/conditioning_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/dog-zwx/images/train/inputs_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/dog-zwx/images/train/inputs_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..d20c35b4e562919f08e99dbff041ad08d2526f64 Binary files /dev/null and b/dreamedit_official_ckpt/dog-zwx/images/train/inputs_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/dog-zwx/images/train/reconstruction_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/dog-zwx/images/train/reconstruction_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..bd2487bf6802e8786d00cee93dca013233065fc4 Binary files /dev/null and b/dreamedit_official_ckpt/dog-zwx/images/train/reconstruction_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/dog-zwx/images/train/samples_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/dog-zwx/images/train/samples_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..9d40b5071e5a2901ef79f9e1801f0b63634f56c5 Binary files /dev/null and b/dreamedit_official_ckpt/dog-zwx/images/train/samples_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/dog-zwx/images/train/samples_scaled_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/dog-zwx/images/train/samples_scaled_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..a6df2e92011032db28d53c3b7061cd754096d620 Binary files /dev/null and b/dreamedit_official_ckpt/dog-zwx/images/train/samples_scaled_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/dog2-gdj/checkpoints/last.ckpt b/dreamedit_official_ckpt/dog2-gdj/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..9e21d339a05fefceab00ac5ccc42a7ab828f8f4d --- /dev/null +++ b/dreamedit_official_ckpt/dog2-gdj/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08775ee0a5d097078897a276e98f5e5c974c505fdef9ab2f0ac27fd6a037d762 +size 12126699506 diff --git a/dreamedit_official_ckpt/dog2-gdj/configs/dog22023-04-17T00-42-22-lightning.yaml b/dreamedit_official_ckpt/dog2-gdj/configs/dog22023-04-17T00-42-22-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..1e71187c01f2747bb12107efc9bffe81ce8fafc7 --- /dev/null +++ b/dreamedit_official_ckpt/dog2-gdj/configs/dog22023-04-17T00-42-22-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 1, diff --git a/dreamedit_official_ckpt/dog2-gdj/configs/dog22023-04-17T00-42-22-project.yaml b/dreamedit_official_ckpt/dog2-gdj/configs/dog22023-04-17T00-42-22-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..d82756d6e27d9b99c6bce3f9d8974c7ef276c278 --- /dev/null +++ b/dreamedit_official_ckpt/dog2-gdj/configs/dog22023-04-17T00-42-22-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: gdj + placeholder_token: dog + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: dog + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: dog diff --git a/dreamedit_official_ckpt/dog2-gdj/images/train/conditioning_gs-000500_e-000000_b-000500.jpg b/dreamedit_official_ckpt/dog2-gdj/images/train/conditioning_gs-000500_e-000000_b-000500.jpg new file mode 100755 index 0000000000000000000000000000000000000000..db138748c769cf3f9ad7798f8f6553a41edaf15d Binary files /dev/null and b/dreamedit_official_ckpt/dog2-gdj/images/train/conditioning_gs-000500_e-000000_b-000500.jpg differ diff --git a/dreamedit_official_ckpt/dog2-gdj/images/train/inputs_gs-000500_e-000000_b-000500.jpg b/dreamedit_official_ckpt/dog2-gdj/images/train/inputs_gs-000500_e-000000_b-000500.jpg new file mode 100755 index 0000000000000000000000000000000000000000..610f04772a08ee17193644e2ea9931f9fa0c10ad Binary files /dev/null and b/dreamedit_official_ckpt/dog2-gdj/images/train/inputs_gs-000500_e-000000_b-000500.jpg differ diff --git a/dreamedit_official_ckpt/dog2-gdj/images/train/reconstruction_gs-000500_e-000000_b-000500.jpg b/dreamedit_official_ckpt/dog2-gdj/images/train/reconstruction_gs-000500_e-000000_b-000500.jpg new file mode 100755 index 0000000000000000000000000000000000000000..1c3102deb4a6076d9471cf7648652a32aa9b6d8b Binary files /dev/null and b/dreamedit_official_ckpt/dog2-gdj/images/train/reconstruction_gs-000500_e-000000_b-000500.jpg differ diff --git a/dreamedit_official_ckpt/dog2-gdj/images/train/samples_gs-000500_e-000000_b-000500.jpg b/dreamedit_official_ckpt/dog2-gdj/images/train/samples_gs-000500_e-000000_b-000500.jpg new file mode 100755 index 0000000000000000000000000000000000000000..8e40d3c5f27652de01c11127b8c5126bd3373ad3 Binary files /dev/null and b/dreamedit_official_ckpt/dog2-gdj/images/train/samples_gs-000500_e-000000_b-000500.jpg differ diff --git a/dreamedit_official_ckpt/dog2-gdj/images/train/samples_scaled_gs-000500_e-000000_b-000500.jpg b/dreamedit_official_ckpt/dog2-gdj/images/train/samples_scaled_gs-000500_e-000000_b-000500.jpg new file mode 100755 index 0000000000000000000000000000000000000000..3632dfe04220dd1ff036104dec2db6f1a3d42cb9 Binary files /dev/null and b/dreamedit_official_ckpt/dog2-gdj/images/train/samples_scaled_gs-000500_e-000000_b-000500.jpg differ diff --git a/dreamedit_official_ckpt/dog3-kdh/checkpoints/last.ckpt b/dreamedit_official_ckpt/dog3-kdh/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..31f646443d60519708ec2063fed440721307ccd7 --- /dev/null +++ b/dreamedit_official_ckpt/dog3-kdh/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:624da0730d2d1f142260cb6beb438157373f25ba258801182d285dabc0d897a1 +size 12126699506 diff --git a/dreamedit_official_ckpt/dog3-kdh/configs/dog32023-04-17T00-45-07-lightning.yaml b/dreamedit_official_ckpt/dog3-kdh/configs/dog32023-04-17T00-45-07-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..75133130d454a72424ce6d28a7f8246b5706b028 --- /dev/null +++ b/dreamedit_official_ckpt/dog3-kdh/configs/dog32023-04-17T00-45-07-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 2, diff --git a/dreamedit_official_ckpt/dog3-kdh/configs/dog32023-04-17T00-45-07-project.yaml b/dreamedit_official_ckpt/dog3-kdh/configs/dog32023-04-17T00-45-07-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..e331e3fd5b4ddcf0da02fb6e84b1ba5ae6d32a08 --- /dev/null +++ b/dreamedit_official_ckpt/dog3-kdh/configs/dog32023-04-17T00-45-07-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: kdh + placeholder_token: dog + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: dog + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: dog diff --git a/dreamedit_official_ckpt/dog3-kdh/images/train/conditioning_gs-000500_e-000000_b-000500.jpg b/dreamedit_official_ckpt/dog3-kdh/images/train/conditioning_gs-000500_e-000000_b-000500.jpg new file mode 100755 index 0000000000000000000000000000000000000000..074aa0581ee3abb3358ab6983c093029d9ca91db Binary files /dev/null and b/dreamedit_official_ckpt/dog3-kdh/images/train/conditioning_gs-000500_e-000000_b-000500.jpg differ diff --git a/dreamedit_official_ckpt/dog3-kdh/images/train/inputs_gs-000500_e-000000_b-000500.jpg b/dreamedit_official_ckpt/dog3-kdh/images/train/inputs_gs-000500_e-000000_b-000500.jpg new file mode 100755 index 0000000000000000000000000000000000000000..f74cc62fa5c0fff1707a6a9f4e832e8ccd6b6319 Binary files /dev/null and b/dreamedit_official_ckpt/dog3-kdh/images/train/inputs_gs-000500_e-000000_b-000500.jpg differ diff --git a/dreamedit_official_ckpt/dog3-kdh/images/train/reconstruction_gs-000500_e-000000_b-000500.jpg b/dreamedit_official_ckpt/dog3-kdh/images/train/reconstruction_gs-000500_e-000000_b-000500.jpg new file mode 100755 index 0000000000000000000000000000000000000000..413a1c935839cfca21dfa811ba87789fa85e7c05 Binary files /dev/null and b/dreamedit_official_ckpt/dog3-kdh/images/train/reconstruction_gs-000500_e-000000_b-000500.jpg differ diff --git a/dreamedit_official_ckpt/dog3-kdh/images/train/samples_gs-000500_e-000000_b-000500.jpg b/dreamedit_official_ckpt/dog3-kdh/images/train/samples_gs-000500_e-000000_b-000500.jpg new file mode 100755 index 0000000000000000000000000000000000000000..c8fc1d9a5647860129f4caa7186d97276c32c8a0 Binary files /dev/null and b/dreamedit_official_ckpt/dog3-kdh/images/train/samples_gs-000500_e-000000_b-000500.jpg differ diff --git a/dreamedit_official_ckpt/dog3-kdh/images/train/samples_scaled_gs-000500_e-000000_b-000500.jpg b/dreamedit_official_ckpt/dog3-kdh/images/train/samples_scaled_gs-000500_e-000000_b-000500.jpg new file mode 100755 index 0000000000000000000000000000000000000000..85ed88929a4b7ca795d9ae609d4e4e6d4a74a547 Binary files /dev/null and b/dreamedit_official_ckpt/dog3-kdh/images/train/samples_scaled_gs-000500_e-000000_b-000500.jpg differ diff --git a/dreamedit_official_ckpt/dog5-oeu/checkpoints/last.ckpt b/dreamedit_official_ckpt/dog5-oeu/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..179ab4c2c7f96ac3689154d5159c36118832cf4b --- /dev/null +++ b/dreamedit_official_ckpt/dog5-oeu/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f9c3c0fcf2f22501222cd2c5b2d7470c2320e6bca38da13dac2a92ea48f118e +size 12126699506 diff --git a/dreamedit_official_ckpt/dog5-oeu/configs/dog52023-04-17T00-52-34-lightning.yaml b/dreamedit_official_ckpt/dog5-oeu/configs/dog52023-04-17T00-52-34-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..86a4212d937ea1b90a03322341249a5095fc6559 --- /dev/null +++ b/dreamedit_official_ckpt/dog5-oeu/configs/dog52023-04-17T00-52-34-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 4, diff --git a/dreamedit_official_ckpt/dog5-oeu/configs/dog52023-04-17T00-52-34-project.yaml b/dreamedit_official_ckpt/dog5-oeu/configs/dog52023-04-17T00-52-34-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..fb2de2fae4092b28d7bc4d8c6afac59c0952b875 --- /dev/null +++ b/dreamedit_official_ckpt/dog5-oeu/configs/dog52023-04-17T00-52-34-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: oeu + placeholder_token: dog + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: dog + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: dog diff --git a/dreamedit_official_ckpt/dog5-oeu/images/train/conditioning_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/dog5-oeu/images/train/conditioning_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..52ed826f3dba2c35c501396b3fe0ee73addc425b Binary files /dev/null and b/dreamedit_official_ckpt/dog5-oeu/images/train/conditioning_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/dog5-oeu/images/train/inputs_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/dog5-oeu/images/train/inputs_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..c6e920f28740cb14048714d31429c02595539c45 Binary files /dev/null and b/dreamedit_official_ckpt/dog5-oeu/images/train/inputs_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/dog5-oeu/images/train/reconstruction_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/dog5-oeu/images/train/reconstruction_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..5e52464d2a36023a18e1950d5cd964fb79de99aa Binary files /dev/null and b/dreamedit_official_ckpt/dog5-oeu/images/train/reconstruction_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/dog5-oeu/images/train/samples_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/dog5-oeu/images/train/samples_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..19ca0e8648c0a53fc1eb62ba6d3799e280981fbd Binary files /dev/null and b/dreamedit_official_ckpt/dog5-oeu/images/train/samples_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/dog5-oeu/images/train/samples_scaled_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/dog5-oeu/images/train/samples_scaled_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..2a7217dcf21230634163ece5e17d786a891f6bbc Binary files /dev/null and b/dreamedit_official_ckpt/dog5-oeu/images/train/samples_scaled_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/dog6-dfn/checkpoints/last.ckpt b/dreamedit_official_ckpt/dog6-dfn/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..bc56280cf03bb285771b21f094667d445cea3c3b --- /dev/null +++ b/dreamedit_official_ckpt/dog6-dfn/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8e76fd16b7765825e0a7bea1ca5d11f413617493e7ccbc2e7e79fe56c5f2cb2 +size 12126699506 diff --git a/dreamedit_official_ckpt/dog6-dfn/configs/dog62023-04-17T00-55-18-lightning.yaml b/dreamedit_official_ckpt/dog6-dfn/configs/dog62023-04-17T00-55-18-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..447a5bcab7ab5a559636440b22776a41d6cf3b17 --- /dev/null +++ b/dreamedit_official_ckpt/dog6-dfn/configs/dog62023-04-17T00-55-18-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 3, diff --git a/dreamedit_official_ckpt/dog6-dfn/configs/dog62023-04-17T00-55-18-project.yaml b/dreamedit_official_ckpt/dog6-dfn/configs/dog62023-04-17T00-55-18-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..dd5bb98387df4c85a8e138cd7fe6974411c3a972 --- /dev/null +++ b/dreamedit_official_ckpt/dog6-dfn/configs/dog62023-04-17T00-55-18-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: dfn + placeholder_token: dog + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: dog + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: dog diff --git a/dreamedit_official_ckpt/dog6-dfn/images/train/conditioning_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/dog6-dfn/images/train/conditioning_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..bf2a6955e99bddcbb1f37805c51ef7995a763f33 Binary files /dev/null and b/dreamedit_official_ckpt/dog6-dfn/images/train/conditioning_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/dog6-dfn/images/train/inputs_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/dog6-dfn/images/train/inputs_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..555dc8ddc34ec29c0d4327f634bdb2a0428e6c88 Binary files /dev/null and b/dreamedit_official_ckpt/dog6-dfn/images/train/inputs_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/dog6-dfn/images/train/reconstruction_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/dog6-dfn/images/train/reconstruction_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..339be5f01cedb2778a7efd9861421ed44cec7267 Binary files /dev/null and b/dreamedit_official_ckpt/dog6-dfn/images/train/reconstruction_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/dog6-dfn/images/train/samples_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/dog6-dfn/images/train/samples_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..f6a2496a981dc21feec3b3e3c3fe8b8586425542 Binary files /dev/null and b/dreamedit_official_ckpt/dog6-dfn/images/train/samples_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/dog6-dfn/images/train/samples_scaled_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/dog6-dfn/images/train/samples_scaled_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..e3898cb6a3c61713878a438242dc2f6ab0c7f354 Binary files /dev/null and b/dreamedit_official_ckpt/dog6-dfn/images/train/samples_scaled_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/dog7-fwq/checkpoints/last.ckpt b/dreamedit_official_ckpt/dog7-fwq/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..0b57c3e4513572e7822441eabd774283c067a608 --- /dev/null +++ b/dreamedit_official_ckpt/dog7-fwq/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9ffd4508fec93e3225695ad697531c403896633771136f44debbef07b29b5a5 +size 12126699506 diff --git a/dreamedit_official_ckpt/dog7-fwq/configs/dog72023-04-17T00-56-32-lightning.yaml b/dreamedit_official_ckpt/dog7-fwq/configs/dog72023-04-17T00-56-32-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..c8a0979811d476d52f2ef60fcdfa6cc5ec4ae750 --- /dev/null +++ b/dreamedit_official_ckpt/dog7-fwq/configs/dog72023-04-17T00-56-32-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 5, diff --git a/dreamedit_official_ckpt/dog7-fwq/configs/dog72023-04-17T00-56-32-project.yaml b/dreamedit_official_ckpt/dog7-fwq/configs/dog72023-04-17T00-56-32-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..85dfa39cd71b8526351928a58d35361221df8a36 --- /dev/null +++ b/dreamedit_official_ckpt/dog7-fwq/configs/dog72023-04-17T00-56-32-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: fwq + placeholder_token: dog + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: dog + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: dog diff --git a/dreamedit_official_ckpt/dog7-fwq/images/train/conditioning_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/dog7-fwq/images/train/conditioning_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..bbb80cc106042adfc0ffe663a15d045027036fde Binary files /dev/null and b/dreamedit_official_ckpt/dog7-fwq/images/train/conditioning_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/dog7-fwq/images/train/inputs_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/dog7-fwq/images/train/inputs_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..41030c99e8c84b7449df194b8598b19b3cffca17 Binary files /dev/null and b/dreamedit_official_ckpt/dog7-fwq/images/train/inputs_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/dog7-fwq/images/train/reconstruction_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/dog7-fwq/images/train/reconstruction_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..983421a8a4c20e7401df93fb23dd5026995cf882 Binary files /dev/null and b/dreamedit_official_ckpt/dog7-fwq/images/train/reconstruction_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/dog7-fwq/images/train/samples_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/dog7-fwq/images/train/samples_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..4575c7d53dc1350ea1e6342e2e475a5aae3fd0c2 Binary files /dev/null and b/dreamedit_official_ckpt/dog7-fwq/images/train/samples_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/dog7-fwq/images/train/samples_scaled_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/dog7-fwq/images/train/samples_scaled_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..beb675042b79bbae368f54aa759991be9d1095bc Binary files /dev/null and b/dreamedit_official_ckpt/dog7-fwq/images/train/samples_scaled_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/dog8-wie/checkpoints/last.ckpt b/dreamedit_official_ckpt/dog8-wie/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..b5cd6312d479c85497b23009b107cf0d9df0b348 --- /dev/null +++ b/dreamedit_official_ckpt/dog8-wie/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ddab830c831c5bcb622bb1913910c05eb479231c98e24f1b8bcd229cbf8fb3b +size 12126699506 diff --git a/dreamedit_official_ckpt/dog8-wie/configs/dog82023-04-17T00-58-03-lightning.yaml b/dreamedit_official_ckpt/dog8-wie/configs/dog82023-04-17T00-58-03-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..67452d0424c3cbea07d0c7a9e8a8018d2baa3b9b --- /dev/null +++ b/dreamedit_official_ckpt/dog8-wie/configs/dog82023-04-17T00-58-03-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 6, diff --git a/dreamedit_official_ckpt/dog8-wie/configs/dog82023-04-17T00-58-03-project.yaml b/dreamedit_official_ckpt/dog8-wie/configs/dog82023-04-17T00-58-03-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..4e76ab29c897e4b90b253733b10061cfb4ed02e3 --- /dev/null +++ b/dreamedit_official_ckpt/dog8-wie/configs/dog82023-04-17T00-58-03-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: wie + placeholder_token: dog + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: dog + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: dog diff --git a/dreamedit_official_ckpt/dog8-wie/images/train/conditioning_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/dog8-wie/images/train/conditioning_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..7d55a9500fdc96dba2e5a2d2d4e12873058ca5fb Binary files /dev/null and b/dreamedit_official_ckpt/dog8-wie/images/train/conditioning_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/dog8-wie/images/train/inputs_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/dog8-wie/images/train/inputs_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..0c4933af0a5e6cad421086efa441a04191abac69 Binary files /dev/null and b/dreamedit_official_ckpt/dog8-wie/images/train/inputs_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/dog8-wie/images/train/reconstruction_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/dog8-wie/images/train/reconstruction_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..da1e70d3912cf74588b0e0815ff9c33891414b58 Binary files /dev/null and b/dreamedit_official_ckpt/dog8-wie/images/train/reconstruction_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/dog8-wie/images/train/samples_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/dog8-wie/images/train/samples_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..ef89af8f47b83c302f1b9ddd720382213b982593 Binary files /dev/null and b/dreamedit_official_ckpt/dog8-wie/images/train/samples_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/dog8-wie/images/train/samples_scaled_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/dog8-wie/images/train/samples_scaled_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..ee352c184e18b9f995c9345171f87fa1735bfdf1 Binary files /dev/null and b/dreamedit_official_ckpt/dog8-wie/images/train/samples_scaled_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/duck_toy-oeb/checkpoints/last.ckpt b/dreamedit_official_ckpt/duck_toy-oeb/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..63f2b09752cb540c3e8dc75a4f9d873aef179a1c --- /dev/null +++ b/dreamedit_official_ckpt/duck_toy-oeb/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c610f34a9867d4776a429ad9d74c9a947986011914b9ffd57b416a50add6da5 +size 12126699889 diff --git a/dreamedit_official_ckpt/duck_toy-oeb/configs/duck_toy2023-04-17T02-02-20-lightning.yaml b/dreamedit_official_ckpt/duck_toy-oeb/configs/duck_toy2023-04-17T02-02-20-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..1e71187c01f2747bb12107efc9bffe81ce8fafc7 --- /dev/null +++ b/dreamedit_official_ckpt/duck_toy-oeb/configs/duck_toy2023-04-17T02-02-20-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 1, diff --git a/dreamedit_official_ckpt/duck_toy-oeb/configs/duck_toy2023-04-17T02-02-20-project.yaml b/dreamedit_official_ckpt/duck_toy-oeb/configs/duck_toy2023-04-17T02-02-20-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..0185cde2e1c7d6f9f24c0d230e2fa83854526b10 --- /dev/null +++ b/dreamedit_official_ckpt/duck_toy-oeb/configs/duck_toy2023-04-17T02-02-20-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: oeb + placeholder_token: duck toy + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: duck toy + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: duck toy diff --git a/dreamedit_official_ckpt/duck_toy-oeb/images/train/conditioning_gs-000500_e-000001_b-000100.jpg b/dreamedit_official_ckpt/duck_toy-oeb/images/train/conditioning_gs-000500_e-000001_b-000100.jpg new file mode 100755 index 0000000000000000000000000000000000000000..40eb0b9061f6cf07c60ca13eb1fbd1e0d980ccaf Binary files /dev/null and b/dreamedit_official_ckpt/duck_toy-oeb/images/train/conditioning_gs-000500_e-000001_b-000100.jpg differ diff --git a/dreamedit_official_ckpt/duck_toy-oeb/images/train/inputs_gs-000500_e-000001_b-000100.jpg b/dreamedit_official_ckpt/duck_toy-oeb/images/train/inputs_gs-000500_e-000001_b-000100.jpg new file mode 100755 index 0000000000000000000000000000000000000000..5ae8e79dd15d83ae1fe97c008732a3a3618ad768 Binary files /dev/null and b/dreamedit_official_ckpt/duck_toy-oeb/images/train/inputs_gs-000500_e-000001_b-000100.jpg differ diff --git a/dreamedit_official_ckpt/duck_toy-oeb/images/train/reconstruction_gs-000500_e-000001_b-000100.jpg b/dreamedit_official_ckpt/duck_toy-oeb/images/train/reconstruction_gs-000500_e-000001_b-000100.jpg new file mode 100755 index 0000000000000000000000000000000000000000..43e33efb803c00fb84290c30d1396f3787ac8f76 Binary files /dev/null and b/dreamedit_official_ckpt/duck_toy-oeb/images/train/reconstruction_gs-000500_e-000001_b-000100.jpg differ diff --git a/dreamedit_official_ckpt/duck_toy-oeb/images/train/samples_gs-000500_e-000001_b-000100.jpg b/dreamedit_official_ckpt/duck_toy-oeb/images/train/samples_gs-000500_e-000001_b-000100.jpg new file mode 100755 index 0000000000000000000000000000000000000000..e4fc46ae34a8ea8a223c9bb2895eddd7d220e65d Binary files /dev/null and b/dreamedit_official_ckpt/duck_toy-oeb/images/train/samples_gs-000500_e-000001_b-000100.jpg differ diff --git a/dreamedit_official_ckpt/duck_toy-oeb/images/train/samples_scaled_gs-000500_e-000001_b-000100.jpg b/dreamedit_official_ckpt/duck_toy-oeb/images/train/samples_scaled_gs-000500_e-000001_b-000100.jpg new file mode 100755 index 0000000000000000000000000000000000000000..75f86d46956eced9471d643a04c1d8982ab55abc Binary files /dev/null and b/dreamedit_official_ckpt/duck_toy-oeb/images/train/samples_scaled_gs-000500_e-000001_b-000100.jpg differ diff --git a/dreamedit_official_ckpt/fancy_boot-upd/checkpoints/last.ckpt b/dreamedit_official_ckpt/fancy_boot-upd/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..2b6c636be45c0c0dda9dea9e7828dc4821323e3f --- /dev/null +++ b/dreamedit_official_ckpt/fancy_boot-upd/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78d69139a42aae2a99d4db1477b6693c79bcfa27e548e2ab336274f3ef1b15a2 +size 12126699889 diff --git a/dreamedit_official_ckpt/fancy_boot-upd/configs/fancy_boot2023-04-17T02-27-44-lightning.yaml b/dreamedit_official_ckpt/fancy_boot-upd/configs/fancy_boot2023-04-17T02-27-44-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..75133130d454a72424ce6d28a7f8246b5706b028 --- /dev/null +++ b/dreamedit_official_ckpt/fancy_boot-upd/configs/fancy_boot2023-04-17T02-27-44-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 2, diff --git a/dreamedit_official_ckpt/fancy_boot-upd/configs/fancy_boot2023-04-17T02-27-44-project.yaml b/dreamedit_official_ckpt/fancy_boot-upd/configs/fancy_boot2023-04-17T02-27-44-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..313b2bd3b6b0e8851240ad872d1aa82bbb57f8e6 --- /dev/null +++ b/dreamedit_official_ckpt/fancy_boot-upd/configs/fancy_boot2023-04-17T02-27-44-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: upd + placeholder_token: fancy boot + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: fancy boot + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: fancy boot diff --git a/dreamedit_official_ckpt/fancy_boot-upd/images/train/conditioning_gs-000500_e-000001_b-000010.jpg b/dreamedit_official_ckpt/fancy_boot-upd/images/train/conditioning_gs-000500_e-000001_b-000010.jpg new file mode 100755 index 0000000000000000000000000000000000000000..fd920b0ff01fab942cdbbc66a341b42225157598 Binary files /dev/null and b/dreamedit_official_ckpt/fancy_boot-upd/images/train/conditioning_gs-000500_e-000001_b-000010.jpg differ diff --git a/dreamedit_official_ckpt/fancy_boot-upd/images/train/inputs_gs-000500_e-000001_b-000010.jpg b/dreamedit_official_ckpt/fancy_boot-upd/images/train/inputs_gs-000500_e-000001_b-000010.jpg new file mode 100755 index 0000000000000000000000000000000000000000..7ff3872c229a027edd8d9869fb8fba271c6f4c5a Binary files /dev/null and b/dreamedit_official_ckpt/fancy_boot-upd/images/train/inputs_gs-000500_e-000001_b-000010.jpg differ diff --git a/dreamedit_official_ckpt/fancy_boot-upd/images/train/reconstruction_gs-000500_e-000001_b-000010.jpg b/dreamedit_official_ckpt/fancy_boot-upd/images/train/reconstruction_gs-000500_e-000001_b-000010.jpg new file mode 100755 index 0000000000000000000000000000000000000000..9960e68a56e49937ad4cd1cb80c6467b3ea97231 Binary files /dev/null and b/dreamedit_official_ckpt/fancy_boot-upd/images/train/reconstruction_gs-000500_e-000001_b-000010.jpg differ diff --git a/dreamedit_official_ckpt/fancy_boot-upd/images/train/samples_gs-000500_e-000001_b-000010.jpg b/dreamedit_official_ckpt/fancy_boot-upd/images/train/samples_gs-000500_e-000001_b-000010.jpg new file mode 100755 index 0000000000000000000000000000000000000000..1c02892ec4b277a98698ce0bbd32f8b70bc979a5 Binary files /dev/null and b/dreamedit_official_ckpt/fancy_boot-upd/images/train/samples_gs-000500_e-000001_b-000010.jpg differ diff --git a/dreamedit_official_ckpt/fancy_boot-upd/images/train/samples_scaled_gs-000500_e-000001_b-000010.jpg b/dreamedit_official_ckpt/fancy_boot-upd/images/train/samples_scaled_gs-000500_e-000001_b-000010.jpg new file mode 100755 index 0000000000000000000000000000000000000000..e78389902e602ba5fb0bb7dbdaf560d1a47cfd14 Binary files /dev/null and b/dreamedit_official_ckpt/fancy_boot-upd/images/train/samples_scaled_gs-000500_e-000001_b-000010.jpg differ diff --git a/dreamedit_official_ckpt/grey_sloth_plushie-xha/checkpoints/last.ckpt b/dreamedit_official_ckpt/grey_sloth_plushie-xha/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..b8a5fdb73e25748e1f8a7082ea3d0bd993c1b8dd --- /dev/null +++ b/dreamedit_official_ckpt/grey_sloth_plushie-xha/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c478a32b778392f73c5bf1514d46508aa169b6d808635cf3fbdedab18d317836 +size 12126699953 diff --git a/dreamedit_official_ckpt/grey_sloth_plushie-xha/configs/grey_sloth_plushie2023-04-17T02-06-50-lightning.yaml b/dreamedit_official_ckpt/grey_sloth_plushie-xha/configs/grey_sloth_plushie2023-04-17T02-06-50-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..447a5bcab7ab5a559636440b22776a41d6cf3b17 --- /dev/null +++ b/dreamedit_official_ckpt/grey_sloth_plushie-xha/configs/grey_sloth_plushie2023-04-17T02-06-50-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 3, diff --git a/dreamedit_official_ckpt/grey_sloth_plushie-xha/configs/grey_sloth_plushie2023-04-17T02-06-50-project.yaml b/dreamedit_official_ckpt/grey_sloth_plushie-xha/configs/grey_sloth_plushie2023-04-17T02-06-50-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..4337314d3bed43c15f23c2410180cfce3f450017 --- /dev/null +++ b/dreamedit_official_ckpt/grey_sloth_plushie-xha/configs/grey_sloth_plushie2023-04-17T02-06-50-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: xha + placeholder_token: grey sloth plushie + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: grey sloth plushie + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: grey sloth plushie diff --git a/dreamedit_official_ckpt/grey_sloth_plushie-xha/images/train/conditioning_gs-000500_e-000001_b-000060.jpg b/dreamedit_official_ckpt/grey_sloth_plushie-xha/images/train/conditioning_gs-000500_e-000001_b-000060.jpg new file mode 100755 index 0000000000000000000000000000000000000000..5ca5563e3c60801403b51c9f6491931925553a66 Binary files /dev/null and b/dreamedit_official_ckpt/grey_sloth_plushie-xha/images/train/conditioning_gs-000500_e-000001_b-000060.jpg differ diff --git a/dreamedit_official_ckpt/grey_sloth_plushie-xha/images/train/inputs_gs-000500_e-000001_b-000060.jpg b/dreamedit_official_ckpt/grey_sloth_plushie-xha/images/train/inputs_gs-000500_e-000001_b-000060.jpg new file mode 100755 index 0000000000000000000000000000000000000000..b1b73b5334abc8be5d7e2b153d983209c7a7a5eb Binary files /dev/null and b/dreamedit_official_ckpt/grey_sloth_plushie-xha/images/train/inputs_gs-000500_e-000001_b-000060.jpg differ diff --git a/dreamedit_official_ckpt/grey_sloth_plushie-xha/images/train/reconstruction_gs-000500_e-000001_b-000060.jpg b/dreamedit_official_ckpt/grey_sloth_plushie-xha/images/train/reconstruction_gs-000500_e-000001_b-000060.jpg new file mode 100755 index 0000000000000000000000000000000000000000..c5af85eb84b545d1d9291c83647948d172ffa21a Binary files /dev/null and b/dreamedit_official_ckpt/grey_sloth_plushie-xha/images/train/reconstruction_gs-000500_e-000001_b-000060.jpg differ diff --git a/dreamedit_official_ckpt/grey_sloth_plushie-xha/images/train/samples_gs-000500_e-000001_b-000060.jpg b/dreamedit_official_ckpt/grey_sloth_plushie-xha/images/train/samples_gs-000500_e-000001_b-000060.jpg new file mode 100755 index 0000000000000000000000000000000000000000..9050cf8d87fa8675a1bdd83ab060ff3b27fbe061 Binary files /dev/null and b/dreamedit_official_ckpt/grey_sloth_plushie-xha/images/train/samples_gs-000500_e-000001_b-000060.jpg differ diff --git a/dreamedit_official_ckpt/grey_sloth_plushie-xha/images/train/samples_scaled_gs-000500_e-000001_b-000060.jpg b/dreamedit_official_ckpt/grey_sloth_plushie-xha/images/train/samples_scaled_gs-000500_e-000001_b-000060.jpg new file mode 100755 index 0000000000000000000000000000000000000000..b98724fba45ac1a7b166ca87f152abfeb9813b72 Binary files /dev/null and b/dreamedit_official_ckpt/grey_sloth_plushie-xha/images/train/samples_scaled_gs-000500_e-000001_b-000060.jpg differ diff --git a/dreamedit_official_ckpt/monster_toy-vka/checkpoints/last.ckpt b/dreamedit_official_ckpt/monster_toy-vka/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..ff9331a97717dae242f6e644a6ecc33a1c734329 --- /dev/null +++ b/dreamedit_official_ckpt/monster_toy-vka/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b83fad41738735a2723c421ed5592b2e77edbb5960283e62330f91a4ad9aeb0 +size 12126699506 diff --git a/dreamedit_official_ckpt/monster_toy-vka/configs/monster_toy2023-04-17T02-12-12-lightning.yaml b/dreamedit_official_ckpt/monster_toy-vka/configs/monster_toy2023-04-17T02-12-12-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..86a4212d937ea1b90a03322341249a5095fc6559 --- /dev/null +++ b/dreamedit_official_ckpt/monster_toy-vka/configs/monster_toy2023-04-17T02-12-12-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 4, diff --git a/dreamedit_official_ckpt/monster_toy-vka/configs/monster_toy2023-04-17T02-12-12-project.yaml b/dreamedit_official_ckpt/monster_toy-vka/configs/monster_toy2023-04-17T02-12-12-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..de2f5387b77efc407b461bd81180aa749e91487d --- /dev/null +++ b/dreamedit_official_ckpt/monster_toy-vka/configs/monster_toy2023-04-17T02-12-12-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: vka + placeholder_token: monster toy + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: monster toy + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: monster toy diff --git a/dreamedit_official_ckpt/monster_toy-vka/images/train/conditioning_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/monster_toy-vka/images/train/conditioning_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..a8dcadb49828e64866acb8f90a0be6fec6cde198 Binary files /dev/null and b/dreamedit_official_ckpt/monster_toy-vka/images/train/conditioning_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/monster_toy-vka/images/train/inputs_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/monster_toy-vka/images/train/inputs_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..b6302514dfa080229d190be3b1a7cc59229e907f Binary files /dev/null and b/dreamedit_official_ckpt/monster_toy-vka/images/train/inputs_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/monster_toy-vka/images/train/reconstruction_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/monster_toy-vka/images/train/reconstruction_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..c6360d2939b80d7377fbe5eb329d77c59d1d8ef7 Binary files /dev/null and b/dreamedit_official_ckpt/monster_toy-vka/images/train/reconstruction_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/monster_toy-vka/images/train/samples_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/monster_toy-vka/images/train/samples_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..5d063da3e95b1b9bc2ab981bfb633c28f19ee305 Binary files /dev/null and b/dreamedit_official_ckpt/monster_toy-vka/images/train/samples_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/monster_toy-vka/images/train/samples_scaled_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/monster_toy-vka/images/train/samples_scaled_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..0305a3da699f6bddec16343dd11af3becc91b96f Binary files /dev/null and b/dreamedit_official_ckpt/monster_toy-vka/images/train/samples_scaled_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/pink_sunglasses-rsm/checkpoints/last.ckpt b/dreamedit_official_ckpt/pink_sunglasses-rsm/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..123068e2614e4be41a72e2672ffa7836efb828b6 --- /dev/null +++ b/dreamedit_official_ckpt/pink_sunglasses-rsm/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e1c77951c83c0630df97aa2e1aa5986b11a4ea1ecb4e49705cd42696fd6e782 +size 12126699889 diff --git a/dreamedit_official_ckpt/pink_sunglasses-rsm/configs/pink_sunglasses2023-04-17T02-18-04-lightning.yaml b/dreamedit_official_ckpt/pink_sunglasses-rsm/configs/pink_sunglasses2023-04-17T02-18-04-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..c8a0979811d476d52f2ef60fcdfa6cc5ec4ae750 --- /dev/null +++ b/dreamedit_official_ckpt/pink_sunglasses-rsm/configs/pink_sunglasses2023-04-17T02-18-04-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 5, diff --git a/dreamedit_official_ckpt/pink_sunglasses-rsm/configs/pink_sunglasses2023-04-17T02-18-04-project.yaml b/dreamedit_official_ckpt/pink_sunglasses-rsm/configs/pink_sunglasses2023-04-17T02-18-04-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..e96ee80b47437b769539909d6145bfcc969fbb4f --- /dev/null +++ b/dreamedit_official_ckpt/pink_sunglasses-rsm/configs/pink_sunglasses2023-04-17T02-18-04-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: rsm + placeholder_token: sunglasses + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: sunglasses + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: sunglasses diff --git a/dreamedit_official_ckpt/pink_sunglasses-rsm/images/train/conditioning_gs-000500_e-000001_b-000020.jpg b/dreamedit_official_ckpt/pink_sunglasses-rsm/images/train/conditioning_gs-000500_e-000001_b-000020.jpg new file mode 100755 index 0000000000000000000000000000000000000000..a6ac335caf49d3e6dcdafc9664ed04bb27575efb Binary files /dev/null and b/dreamedit_official_ckpt/pink_sunglasses-rsm/images/train/conditioning_gs-000500_e-000001_b-000020.jpg differ diff --git a/dreamedit_official_ckpt/pink_sunglasses-rsm/images/train/inputs_gs-000500_e-000001_b-000020.jpg b/dreamedit_official_ckpt/pink_sunglasses-rsm/images/train/inputs_gs-000500_e-000001_b-000020.jpg new file mode 100755 index 0000000000000000000000000000000000000000..3fe378a7a40d36e1b471d9fa26a660aece4d680e Binary files /dev/null and b/dreamedit_official_ckpt/pink_sunglasses-rsm/images/train/inputs_gs-000500_e-000001_b-000020.jpg differ diff --git a/dreamedit_official_ckpt/pink_sunglasses-rsm/images/train/reconstruction_gs-000500_e-000001_b-000020.jpg b/dreamedit_official_ckpt/pink_sunglasses-rsm/images/train/reconstruction_gs-000500_e-000001_b-000020.jpg new file mode 100755 index 0000000000000000000000000000000000000000..058f81b1182eb081716b0fef38dfa60c019ccc13 Binary files /dev/null and b/dreamedit_official_ckpt/pink_sunglasses-rsm/images/train/reconstruction_gs-000500_e-000001_b-000020.jpg differ diff --git a/dreamedit_official_ckpt/pink_sunglasses-rsm/images/train/samples_gs-000500_e-000001_b-000020.jpg b/dreamedit_official_ckpt/pink_sunglasses-rsm/images/train/samples_gs-000500_e-000001_b-000020.jpg new file mode 100755 index 0000000000000000000000000000000000000000..3f579a8ab8cb79f6784341554639597486e8d94b Binary files /dev/null and b/dreamedit_official_ckpt/pink_sunglasses-rsm/images/train/samples_gs-000500_e-000001_b-000020.jpg differ diff --git a/dreamedit_official_ckpt/pink_sunglasses-rsm/images/train/samples_scaled_gs-000500_e-000001_b-000020.jpg b/dreamedit_official_ckpt/pink_sunglasses-rsm/images/train/samples_scaled_gs-000500_e-000001_b-000020.jpg new file mode 100755 index 0000000000000000000000000000000000000000..fc3b2dd2dd81d0e682bde44f0ed6d882c62ba835 Binary files /dev/null and b/dreamedit_official_ckpt/pink_sunglasses-rsm/images/train/samples_scaled_gs-000500_e-000001_b-000020.jpg differ diff --git a/dreamedit_official_ckpt/poop_emoji-dzs/checkpoints/last.ckpt b/dreamedit_official_ckpt/poop_emoji-dzs/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..4394b6f1548f0c4c89b03cd2dcbd9d5e80fe253e --- /dev/null +++ b/dreamedit_official_ckpt/poop_emoji-dzs/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e261884f70f2d73528753e89935c4de0fe421c372352813f05d39c08e53b6703 +size 12126699889 diff --git a/dreamedit_official_ckpt/poop_emoji-dzs/configs/poop_emoji2023-04-17T02-25-27-lightning.yaml b/dreamedit_official_ckpt/poop_emoji-dzs/configs/poop_emoji2023-04-17T02-25-27-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..67452d0424c3cbea07d0c7a9e8a8018d2baa3b9b --- /dev/null +++ b/dreamedit_official_ckpt/poop_emoji-dzs/configs/poop_emoji2023-04-17T02-25-27-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 6, diff --git a/dreamedit_official_ckpt/poop_emoji-dzs/configs/poop_emoji2023-04-17T02-25-27-project.yaml b/dreamedit_official_ckpt/poop_emoji-dzs/configs/poop_emoji2023-04-17T02-25-27-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..958035a86d2f0621aeea85af5ca747ba80f6ea6d --- /dev/null +++ b/dreamedit_official_ckpt/poop_emoji-dzs/configs/poop_emoji2023-04-17T02-25-27-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: dzs + placeholder_token: poop emoji + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: poop emoji + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: poop emoji diff --git a/dreamedit_official_ckpt/poop_emoji-dzs/images/train/conditioning_gs-000500_e-000001_b-000110.jpg b/dreamedit_official_ckpt/poop_emoji-dzs/images/train/conditioning_gs-000500_e-000001_b-000110.jpg new file mode 100755 index 0000000000000000000000000000000000000000..84f0e875cf6f5d53c969b6b935f623e0e85faf84 Binary files /dev/null and b/dreamedit_official_ckpt/poop_emoji-dzs/images/train/conditioning_gs-000500_e-000001_b-000110.jpg differ diff --git a/dreamedit_official_ckpt/poop_emoji-dzs/images/train/inputs_gs-000500_e-000001_b-000110.jpg b/dreamedit_official_ckpt/poop_emoji-dzs/images/train/inputs_gs-000500_e-000001_b-000110.jpg new file mode 100755 index 0000000000000000000000000000000000000000..ed3595bd6f3c309f7bceb9b3c04bc43c4064b97e Binary files /dev/null and b/dreamedit_official_ckpt/poop_emoji-dzs/images/train/inputs_gs-000500_e-000001_b-000110.jpg differ diff --git a/dreamedit_official_ckpt/poop_emoji-dzs/images/train/reconstruction_gs-000500_e-000001_b-000110.jpg b/dreamedit_official_ckpt/poop_emoji-dzs/images/train/reconstruction_gs-000500_e-000001_b-000110.jpg new file mode 100755 index 0000000000000000000000000000000000000000..6f8e2127813aeb5a89b5ded12e95e115f79140af Binary files /dev/null and b/dreamedit_official_ckpt/poop_emoji-dzs/images/train/reconstruction_gs-000500_e-000001_b-000110.jpg differ diff --git a/dreamedit_official_ckpt/poop_emoji-dzs/images/train/samples_gs-000500_e-000001_b-000110.jpg b/dreamedit_official_ckpt/poop_emoji-dzs/images/train/samples_gs-000500_e-000001_b-000110.jpg new file mode 100755 index 0000000000000000000000000000000000000000..029f85917747900cdc9ead0c6928429159f7fa54 Binary files /dev/null and b/dreamedit_official_ckpt/poop_emoji-dzs/images/train/samples_gs-000500_e-000001_b-000110.jpg differ diff --git a/dreamedit_official_ckpt/poop_emoji-dzs/images/train/samples_scaled_gs-000500_e-000001_b-000110.jpg b/dreamedit_official_ckpt/poop_emoji-dzs/images/train/samples_scaled_gs-000500_e-000001_b-000110.jpg new file mode 100755 index 0000000000000000000000000000000000000000..781e3d579bb0674bfe39baffc8cbad763497c130 Binary files /dev/null and b/dreamedit_official_ckpt/poop_emoji-dzs/images/train/samples_scaled_gs-000500_e-000001_b-000110.jpg differ diff --git a/dreamedit_official_ckpt/rc_car-gbp/checkpoints/last.ckpt b/dreamedit_official_ckpt/rc_car-gbp/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..a789c662342f7c70212a599811e2ab00d5173889 --- /dev/null +++ b/dreamedit_official_ckpt/rc_car-gbp/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abfbd02685f2613dc1e1c0e1f86dcfde11b2a0b983b037ed3369c78f06a45d86 +size 12126699889 diff --git a/dreamedit_official_ckpt/rc_car-gbp/configs/rc_car2023-04-17T02-31-20-lightning.yaml b/dreamedit_official_ckpt/rc_car-gbp/configs/rc_car2023-04-17T02-31-20-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..61207c460869b84259f33ce640b420b181231d9c --- /dev/null +++ b/dreamedit_official_ckpt/rc_car-gbp/configs/rc_car2023-04-17T02-31-20-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 7, diff --git a/dreamedit_official_ckpt/rc_car-gbp/configs/rc_car2023-04-17T02-31-20-project.yaml b/dreamedit_official_ckpt/rc_car-gbp/configs/rc_car2023-04-17T02-31-20-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..bdc2284867dc47631463f0007fee9c06ee795983 --- /dev/null +++ b/dreamedit_official_ckpt/rc_car-gbp/configs/rc_car2023-04-17T02-31-20-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: gbp + placeholder_token: car toy + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: car toy + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: car toy diff --git a/dreamedit_official_ckpt/rc_car-gbp/images/train/conditioning_gs-000500_e-000001_b-000110.jpg b/dreamedit_official_ckpt/rc_car-gbp/images/train/conditioning_gs-000500_e-000001_b-000110.jpg new file mode 100755 index 0000000000000000000000000000000000000000..fe8e101bbb170251fcc5b3980651edfe50b45406 Binary files /dev/null and b/dreamedit_official_ckpt/rc_car-gbp/images/train/conditioning_gs-000500_e-000001_b-000110.jpg differ diff --git a/dreamedit_official_ckpt/rc_car-gbp/images/train/inputs_gs-000500_e-000001_b-000110.jpg b/dreamedit_official_ckpt/rc_car-gbp/images/train/inputs_gs-000500_e-000001_b-000110.jpg new file mode 100755 index 0000000000000000000000000000000000000000..a630066c9104cfe9bf96a8bbcb848ef3c87b2b18 Binary files /dev/null and b/dreamedit_official_ckpt/rc_car-gbp/images/train/inputs_gs-000500_e-000001_b-000110.jpg differ diff --git a/dreamedit_official_ckpt/rc_car-gbp/images/train/reconstruction_gs-000500_e-000001_b-000110.jpg b/dreamedit_official_ckpt/rc_car-gbp/images/train/reconstruction_gs-000500_e-000001_b-000110.jpg new file mode 100755 index 0000000000000000000000000000000000000000..e3867afd71e8380fd18d5835dcb342dcda8c770b Binary files /dev/null and b/dreamedit_official_ckpt/rc_car-gbp/images/train/reconstruction_gs-000500_e-000001_b-000110.jpg differ diff --git a/dreamedit_official_ckpt/rc_car-gbp/images/train/samples_gs-000500_e-000001_b-000110.jpg b/dreamedit_official_ckpt/rc_car-gbp/images/train/samples_gs-000500_e-000001_b-000110.jpg new file mode 100755 index 0000000000000000000000000000000000000000..4ff0d965f89b3eb6fb86ec17bb18eb4eacf0012d Binary files /dev/null and b/dreamedit_official_ckpt/rc_car-gbp/images/train/samples_gs-000500_e-000001_b-000110.jpg differ diff --git a/dreamedit_official_ckpt/rc_car-gbp/images/train/samples_scaled_gs-000500_e-000001_b-000110.jpg b/dreamedit_official_ckpt/rc_car-gbp/images/train/samples_scaled_gs-000500_e-000001_b-000110.jpg new file mode 100755 index 0000000000000000000000000000000000000000..757b1998832b25faf4da4126e73b3d1823c9b9b8 Binary files /dev/null and b/dreamedit_official_ckpt/rc_car-gbp/images/train/samples_scaled_gs-000500_e-000001_b-000110.jpg differ diff --git a/dreamedit_official_ckpt/red_cartoon-jle/checkpoints/last.ckpt b/dreamedit_official_ckpt/red_cartoon-jle/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..8ed5219bc29e3f7ca48b05ec1a359a50214225a3 --- /dev/null +++ b/dreamedit_official_ckpt/red_cartoon-jle/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d740955f0c71933a3e72579f9d8604ccf15a904993da140ab19b832a6867793 +size 12126699889 diff --git a/dreamedit_official_ckpt/red_cartoon-jle/configs/red_cartoon2023-04-17T02-32-58-lightning.yaml b/dreamedit_official_ckpt/red_cartoon-jle/configs/red_cartoon2023-04-17T02-32-58-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..916cc386ab080a09312aee9ce29a611b61e2448a --- /dev/null +++ b/dreamedit_official_ckpt/red_cartoon-jle/configs/red_cartoon2023-04-17T02-32-58-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 0, diff --git a/dreamedit_official_ckpt/red_cartoon-jle/configs/red_cartoon2023-04-17T02-32-58-project.yaml b/dreamedit_official_ckpt/red_cartoon-jle/configs/red_cartoon2023-04-17T02-32-58-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..652d724467c2a764c43803dc070ffbc9cbefb641 --- /dev/null +++ b/dreamedit_official_ckpt/red_cartoon-jle/configs/red_cartoon2023-04-17T02-32-58-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: jle + placeholder_token: cartoon devil + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: cartoon devil + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: cartoon devil diff --git a/dreamedit_official_ckpt/red_cartoon-jle/images/train/conditioning_gs-000500_e-000001_b-000200.jpg b/dreamedit_official_ckpt/red_cartoon-jle/images/train/conditioning_gs-000500_e-000001_b-000200.jpg new file mode 100755 index 0000000000000000000000000000000000000000..37b0f5e41b2715508ebab301fa562b1ba2df418c Binary files /dev/null and b/dreamedit_official_ckpt/red_cartoon-jle/images/train/conditioning_gs-000500_e-000001_b-000200.jpg differ diff --git a/dreamedit_official_ckpt/red_cartoon-jle/images/train/inputs_gs-000500_e-000001_b-000200.jpg b/dreamedit_official_ckpt/red_cartoon-jle/images/train/inputs_gs-000500_e-000001_b-000200.jpg new file mode 100755 index 0000000000000000000000000000000000000000..f2caf40e231c914c47c5b2807fc0f8068d739261 Binary files /dev/null and b/dreamedit_official_ckpt/red_cartoon-jle/images/train/inputs_gs-000500_e-000001_b-000200.jpg differ diff --git a/dreamedit_official_ckpt/red_cartoon-jle/images/train/reconstruction_gs-000500_e-000001_b-000200.jpg b/dreamedit_official_ckpt/red_cartoon-jle/images/train/reconstruction_gs-000500_e-000001_b-000200.jpg new file mode 100755 index 0000000000000000000000000000000000000000..7719dff40b6de15f3e7c73740965f949fbaa785e Binary files /dev/null and b/dreamedit_official_ckpt/red_cartoon-jle/images/train/reconstruction_gs-000500_e-000001_b-000200.jpg differ diff --git a/dreamedit_official_ckpt/red_cartoon-jle/images/train/samples_gs-000500_e-000001_b-000200.jpg b/dreamedit_official_ckpt/red_cartoon-jle/images/train/samples_gs-000500_e-000001_b-000200.jpg new file mode 100755 index 0000000000000000000000000000000000000000..0ccdd002be8fa33f62bfdafb36137a82bd8696df Binary files /dev/null and b/dreamedit_official_ckpt/red_cartoon-jle/images/train/samples_gs-000500_e-000001_b-000200.jpg differ diff --git a/dreamedit_official_ckpt/red_cartoon-jle/images/train/samples_scaled_gs-000500_e-000001_b-000200.jpg b/dreamedit_official_ckpt/red_cartoon-jle/images/train/samples_scaled_gs-000500_e-000001_b-000200.jpg new file mode 100755 index 0000000000000000000000000000000000000000..3bbd1b1265a9bd8ef0adbd2c84782f69f0cd05ad Binary files /dev/null and b/dreamedit_official_ckpt/red_cartoon-jle/images/train/samples_scaled_gs-000500_e-000001_b-000200.jpg differ diff --git a/dreamedit_official_ckpt/robot_toy-oxp/checkpoints/last.ckpt b/dreamedit_official_ckpt/robot_toy-oxp/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..d483f5f06ef7d541c5460f2430ee04475f5f09f2 --- /dev/null +++ b/dreamedit_official_ckpt/robot_toy-oxp/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3e103ed197ec245ba74128e887df9630491a011147ce33f1d462e5c3cdf9aa4 +size 12126699889 diff --git a/dreamedit_official_ckpt/robot_toy-oxp/configs/robot_toy2023-04-17T02-51-28-lightning.yaml b/dreamedit_official_ckpt/robot_toy-oxp/configs/robot_toy2023-04-17T02-51-28-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..1e71187c01f2747bb12107efc9bffe81ce8fafc7 --- /dev/null +++ b/dreamedit_official_ckpt/robot_toy-oxp/configs/robot_toy2023-04-17T02-51-28-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 1, diff --git a/dreamedit_official_ckpt/robot_toy-oxp/configs/robot_toy2023-04-17T02-51-28-project.yaml b/dreamedit_official_ckpt/robot_toy-oxp/configs/robot_toy2023-04-17T02-51-28-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..dd12cf08222875b116fea37d70d6c9d70a949933 --- /dev/null +++ b/dreamedit_official_ckpt/robot_toy-oxp/configs/robot_toy2023-04-17T02-51-28-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: oxp + placeholder_token: robot toy + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: robot toy + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: robot toy diff --git a/dreamedit_official_ckpt/robot_toy-oxp/images/train/conditioning_gs-000500_e-000001_b-000170.jpg b/dreamedit_official_ckpt/robot_toy-oxp/images/train/conditioning_gs-000500_e-000001_b-000170.jpg new file mode 100755 index 0000000000000000000000000000000000000000..a8dba2d10445a617cc3c3901ff41a912d54b3585 Binary files /dev/null and b/dreamedit_official_ckpt/robot_toy-oxp/images/train/conditioning_gs-000500_e-000001_b-000170.jpg differ diff --git a/dreamedit_official_ckpt/robot_toy-oxp/images/train/inputs_gs-000500_e-000001_b-000170.jpg b/dreamedit_official_ckpt/robot_toy-oxp/images/train/inputs_gs-000500_e-000001_b-000170.jpg new file mode 100755 index 0000000000000000000000000000000000000000..2e00898e4af48d2c118f076e731d7044ebcd57f6 Binary files /dev/null and b/dreamedit_official_ckpt/robot_toy-oxp/images/train/inputs_gs-000500_e-000001_b-000170.jpg differ diff --git a/dreamedit_official_ckpt/robot_toy-oxp/images/train/reconstruction_gs-000500_e-000001_b-000170.jpg b/dreamedit_official_ckpt/robot_toy-oxp/images/train/reconstruction_gs-000500_e-000001_b-000170.jpg new file mode 100755 index 0000000000000000000000000000000000000000..4748ece016c33a37d360ad396c7db2528e09ad49 Binary files /dev/null and b/dreamedit_official_ckpt/robot_toy-oxp/images/train/reconstruction_gs-000500_e-000001_b-000170.jpg differ diff --git a/dreamedit_official_ckpt/robot_toy-oxp/images/train/samples_gs-000500_e-000001_b-000170.jpg b/dreamedit_official_ckpt/robot_toy-oxp/images/train/samples_gs-000500_e-000001_b-000170.jpg new file mode 100755 index 0000000000000000000000000000000000000000..30fa34bda93cfa442c9a1b9890ea1738537e64d4 Binary files /dev/null and b/dreamedit_official_ckpt/robot_toy-oxp/images/train/samples_gs-000500_e-000001_b-000170.jpg differ diff --git a/dreamedit_official_ckpt/robot_toy-oxp/images/train/samples_scaled_gs-000500_e-000001_b-000170.jpg b/dreamedit_official_ckpt/robot_toy-oxp/images/train/samples_scaled_gs-000500_e-000001_b-000170.jpg new file mode 100755 index 0000000000000000000000000000000000000000..7e6e4b2f56d06650c70f253fa4bff53362061c84 Binary files /dev/null and b/dreamedit_official_ckpt/robot_toy-oxp/images/train/samples_scaled_gs-000500_e-000001_b-000170.jpg differ diff --git a/dreamedit_official_ckpt/shiny_sneaker-hrw/checkpoints/last.ckpt b/dreamedit_official_ckpt/shiny_sneaker-hrw/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..4e5e36013438e8de4624349626c38d3509fa9215 --- /dev/null +++ b/dreamedit_official_ckpt/shiny_sneaker-hrw/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be4d0facdc1f9e5d797b9f5f84b8b4838f356752a3b96302ebd4dc38fb77319a +size 12126699889 diff --git a/dreamedit_official_ckpt/shiny_sneaker-hrw/configs/shiny_sneaker2023-04-17T02-48-13-lightning.yaml b/dreamedit_official_ckpt/shiny_sneaker-hrw/configs/shiny_sneaker2023-04-17T02-48-13-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..447a5bcab7ab5a559636440b22776a41d6cf3b17 --- /dev/null +++ b/dreamedit_official_ckpt/shiny_sneaker-hrw/configs/shiny_sneaker2023-04-17T02-48-13-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 3, diff --git a/dreamedit_official_ckpt/shiny_sneaker-hrw/configs/shiny_sneaker2023-04-17T02-48-13-project.yaml b/dreamedit_official_ckpt/shiny_sneaker-hrw/configs/shiny_sneaker2023-04-17T02-48-13-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..d9fa124d44832786c6d6c469eda85d3c23a936cb --- /dev/null +++ b/dreamedit_official_ckpt/shiny_sneaker-hrw/configs/shiny_sneaker2023-04-17T02-48-13-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: hrw + placeholder_token: shiny sneaker + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: shiny sneaker + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: shiny sneaker diff --git a/dreamedit_official_ckpt/shiny_sneaker-hrw/images/train/conditioning_gs-000500_e-000001_b-000100.jpg b/dreamedit_official_ckpt/shiny_sneaker-hrw/images/train/conditioning_gs-000500_e-000001_b-000100.jpg new file mode 100755 index 0000000000000000000000000000000000000000..d5fef456754972390e801d3be73226e5baf67b2c Binary files /dev/null and b/dreamedit_official_ckpt/shiny_sneaker-hrw/images/train/conditioning_gs-000500_e-000001_b-000100.jpg differ diff --git a/dreamedit_official_ckpt/shiny_sneaker-hrw/images/train/inputs_gs-000500_e-000001_b-000100.jpg b/dreamedit_official_ckpt/shiny_sneaker-hrw/images/train/inputs_gs-000500_e-000001_b-000100.jpg new file mode 100755 index 0000000000000000000000000000000000000000..7994afc4c98bd94be33e52b26da18fa001e4f30c Binary files /dev/null and b/dreamedit_official_ckpt/shiny_sneaker-hrw/images/train/inputs_gs-000500_e-000001_b-000100.jpg differ diff --git a/dreamedit_official_ckpt/shiny_sneaker-hrw/images/train/reconstruction_gs-000500_e-000001_b-000100.jpg b/dreamedit_official_ckpt/shiny_sneaker-hrw/images/train/reconstruction_gs-000500_e-000001_b-000100.jpg new file mode 100755 index 0000000000000000000000000000000000000000..429337df092e6c2fb1ff2e5a45aae01ddca4bc1d Binary files /dev/null and b/dreamedit_official_ckpt/shiny_sneaker-hrw/images/train/reconstruction_gs-000500_e-000001_b-000100.jpg differ diff --git a/dreamedit_official_ckpt/shiny_sneaker-hrw/images/train/samples_gs-000500_e-000001_b-000100.jpg b/dreamedit_official_ckpt/shiny_sneaker-hrw/images/train/samples_gs-000500_e-000001_b-000100.jpg new file mode 100755 index 0000000000000000000000000000000000000000..32a10c78f416dac087fda083982b5217dd322ddb Binary files /dev/null and b/dreamedit_official_ckpt/shiny_sneaker-hrw/images/train/samples_gs-000500_e-000001_b-000100.jpg differ diff --git a/dreamedit_official_ckpt/shiny_sneaker-hrw/images/train/samples_scaled_gs-000500_e-000001_b-000100.jpg b/dreamedit_official_ckpt/shiny_sneaker-hrw/images/train/samples_scaled_gs-000500_e-000001_b-000100.jpg new file mode 100755 index 0000000000000000000000000000000000000000..a93aa6dbc165a0aba937b024482d65b4e95fbbf5 Binary files /dev/null and b/dreamedit_official_ckpt/shiny_sneaker-hrw/images/train/samples_scaled_gs-000500_e-000001_b-000100.jpg differ diff --git a/dreamedit_official_ckpt/teapot-vfz/checkpoints/last.ckpt b/dreamedit_official_ckpt/teapot-vfz/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..a3bad6433fe3230d03a03e874df6d94210c3f7c6 --- /dev/null +++ b/dreamedit_official_ckpt/teapot-vfz/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:143d6d3cb9b361903d0972890eea672817976035c201498f583f681a6e51c709 +size 12126699889 diff --git a/dreamedit_official_ckpt/teapot-vfz/configs/teapot2023-04-17T02-52-47-lightning.yaml b/dreamedit_official_ckpt/teapot-vfz/configs/teapot2023-04-17T02-52-47-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..86a4212d937ea1b90a03322341249a5095fc6559 --- /dev/null +++ b/dreamedit_official_ckpt/teapot-vfz/configs/teapot2023-04-17T02-52-47-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 4, diff --git a/dreamedit_official_ckpt/teapot-vfz/configs/teapot2023-04-17T02-52-47-project.yaml b/dreamedit_official_ckpt/teapot-vfz/configs/teapot2023-04-17T02-52-47-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..9fff1f221748ea5c1614da589f488f04f8d07c86 --- /dev/null +++ b/dreamedit_official_ckpt/teapot-vfz/configs/teapot2023-04-17T02-52-47-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: vfz + placeholder_token: teapot + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: teapot + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: teapot diff --git a/dreamedit_official_ckpt/teapot-vfz/images/train/conditioning_gs-000500_e-000001_b-000050.jpg b/dreamedit_official_ckpt/teapot-vfz/images/train/conditioning_gs-000500_e-000001_b-000050.jpg new file mode 100755 index 0000000000000000000000000000000000000000..0b29b6f327fbcc887ec06e02c2711376c4c9d7fd Binary files /dev/null and b/dreamedit_official_ckpt/teapot-vfz/images/train/conditioning_gs-000500_e-000001_b-000050.jpg differ diff --git a/dreamedit_official_ckpt/teapot-vfz/images/train/inputs_gs-000500_e-000001_b-000050.jpg b/dreamedit_official_ckpt/teapot-vfz/images/train/inputs_gs-000500_e-000001_b-000050.jpg new file mode 100755 index 0000000000000000000000000000000000000000..ab98ccef17a434a4cc2494a3338baa7e18afbf21 Binary files /dev/null and b/dreamedit_official_ckpt/teapot-vfz/images/train/inputs_gs-000500_e-000001_b-000050.jpg differ diff --git a/dreamedit_official_ckpt/teapot-vfz/images/train/reconstruction_gs-000500_e-000001_b-000050.jpg b/dreamedit_official_ckpt/teapot-vfz/images/train/reconstruction_gs-000500_e-000001_b-000050.jpg new file mode 100755 index 0000000000000000000000000000000000000000..eefeb02568d6c2273408c1e7af0190fb12031cfe Binary files /dev/null and b/dreamedit_official_ckpt/teapot-vfz/images/train/reconstruction_gs-000500_e-000001_b-000050.jpg differ diff --git a/dreamedit_official_ckpt/teapot-vfz/images/train/samples_gs-000500_e-000001_b-000050.jpg b/dreamedit_official_ckpt/teapot-vfz/images/train/samples_gs-000500_e-000001_b-000050.jpg new file mode 100755 index 0000000000000000000000000000000000000000..30a383bd39d48874a8412ad55f871ac921ea1c7a Binary files /dev/null and b/dreamedit_official_ckpt/teapot-vfz/images/train/samples_gs-000500_e-000001_b-000050.jpg differ diff --git a/dreamedit_official_ckpt/teapot-vfz/images/train/samples_scaled_gs-000500_e-000001_b-000050.jpg b/dreamedit_official_ckpt/teapot-vfz/images/train/samples_scaled_gs-000500_e-000001_b-000050.jpg new file mode 100755 index 0000000000000000000000000000000000000000..06a7abce1f8a81fa9988d1decedcb0bb11a86f35 Binary files /dev/null and b/dreamedit_official_ckpt/teapot-vfz/images/train/samples_scaled_gs-000500_e-000001_b-000050.jpg differ diff --git a/dreamedit_official_ckpt/vase-ulc/checkpoints/last.ckpt b/dreamedit_official_ckpt/vase-ulc/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..933e4ddfcd0f0a14ab041b72588345af1a43d64b --- /dev/null +++ b/dreamedit_official_ckpt/vase-ulc/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce7fb7dd5db068939734eeb6df4f9ad3cb673dd372a6354447162337ac60c810 +size 12126699506 diff --git a/dreamedit_official_ckpt/vase-ulc/configs/vase2023-04-17T02-53-31-lightning.yaml b/dreamedit_official_ckpt/vase-ulc/configs/vase2023-04-17T02-53-31-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..c8a0979811d476d52f2ef60fcdfa6cc5ec4ae750 --- /dev/null +++ b/dreamedit_official_ckpt/vase-ulc/configs/vase2023-04-17T02-53-31-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 5, diff --git a/dreamedit_official_ckpt/vase-ulc/configs/vase2023-04-17T02-53-31-project.yaml b/dreamedit_official_ckpt/vase-ulc/configs/vase2023-04-17T02-53-31-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..e045d8def8c01b41abe751be7df50d963e307fe0 --- /dev/null +++ b/dreamedit_official_ckpt/vase-ulc/configs/vase2023-04-17T02-53-31-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: ulc + placeholder_token: vase + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: vase + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: vase diff --git a/dreamedit_official_ckpt/vase-ulc/images/train/conditioning_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/vase-ulc/images/train/conditioning_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..2d61487ef504de9fe4cdd37e6835e33b4a923800 Binary files /dev/null and b/dreamedit_official_ckpt/vase-ulc/images/train/conditioning_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/vase-ulc/images/train/inputs_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/vase-ulc/images/train/inputs_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..eeb3f2365a74c414265ff19e9675ae50e411f525 Binary files /dev/null and b/dreamedit_official_ckpt/vase-ulc/images/train/inputs_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/vase-ulc/images/train/reconstruction_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/vase-ulc/images/train/reconstruction_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..cfb9465f1d73eaedbf5d74914fcd98c441fb52e1 Binary files /dev/null and b/dreamedit_official_ckpt/vase-ulc/images/train/reconstruction_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/vase-ulc/images/train/samples_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/vase-ulc/images/train/samples_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..fa29aefa72d58c03f1c475110b610cbc2461c0d7 Binary files /dev/null and b/dreamedit_official_ckpt/vase-ulc/images/train/samples_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/vase-ulc/images/train/samples_scaled_gs-000500_e-000001_b-000000.jpg b/dreamedit_official_ckpt/vase-ulc/images/train/samples_scaled_gs-000500_e-000001_b-000000.jpg new file mode 100755 index 0000000000000000000000000000000000000000..dbf25196fccc1b320396c4b2cba6be8fb34adb3b Binary files /dev/null and b/dreamedit_official_ckpt/vase-ulc/images/train/samples_scaled_gs-000500_e-000001_b-000000.jpg differ diff --git a/dreamedit_official_ckpt/wolf_plushie-fxg/checkpoints/last.ckpt b/dreamedit_official_ckpt/wolf_plushie-fxg/checkpoints/last.ckpt new file mode 100755 index 0000000000000000000000000000000000000000..2d33c06001cadb7df1c7962676943831bce4f409 --- /dev/null +++ b/dreamedit_official_ckpt/wolf_plushie-fxg/checkpoints/last.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8fb5a6e60e1d2a236eb69de80baae50bd2fd921359707e73dff11eea290bcf5 +size 12126699889 diff --git a/dreamedit_official_ckpt/wolf_plushie-fxg/configs/wolf_plushie2023-04-17T02-55-24-lightning.yaml b/dreamedit_official_ckpt/wolf_plushie-fxg/configs/wolf_plushie2023-04-17T02-55-24-lightning.yaml new file mode 100755 index 0000000000000000000000000000000000000000..67452d0424c3cbea07d0c7a9e8a8018d2baa3b9b --- /dev/null +++ b/dreamedit_official_ckpt/wolf_plushie-fxg/configs/wolf_plushie2023-04-17T02-55-24-lightning.yaml @@ -0,0 +1,16 @@ +lightning: + modelcheckpoint: + params: + every_n_train_steps: 500 + callbacks: + image_logger: + target: main.ImageLogger + params: + batch_frequency: 500 + max_images: 8 + increase_log_steps: false + trainer: + benchmark: true + max_steps: 800 + accelerator: ddp + gpus: 6, diff --git a/dreamedit_official_ckpt/wolf_plushie-fxg/configs/wolf_plushie2023-04-17T02-55-24-project.yaml b/dreamedit_official_ckpt/wolf_plushie-fxg/configs/wolf_plushie2023-04-17T02-55-24-project.yaml new file mode 100755 index 0000000000000000000000000000000000000000..3ac7040249ef6b7125ae68301034a0f12319c4a0 --- /dev/null +++ b/dreamedit_official_ckpt/wolf_plushie-fxg/configs/wolf_plushie2023-04-17T02-55-24-project.yaml @@ -0,0 +1,112 @@ +model: + base_learning_rate: 1.0e-06 + target: ldm.models.diffusion.ddpm.LatentDiffusion + params: + reg_weight: 1.0 + linear_start: 0.00085 + linear_end: 0.012 + num_timesteps_cond: 1 + log_every_t: 200 + timesteps: 1000 + first_stage_key: image + cond_stage_key: caption + image_size: 64 + channels: 4 + cond_stage_trainable: true + conditioning_key: crossattn + monitor: val/loss_simple_ema + scale_factor: 0.18215 + use_ema: false + embedding_reg_weight: 0.0 + unfreeze_model: true + model_lr: 1.0e-06 + personalization_config: + target: ldm.modules.embedding_manager.EmbeddingManager + params: + placeholder_strings: + - '*' + initializer_words: + - sculpture + per_image_tokens: false + num_vectors_per_token: 1 + progressive_words: false + unet_config: + target: ldm.modules.diffusionmodules.openaimodel.UNetModel + params: + image_size: 32 + in_channels: 4 + out_channels: 4 + model_channels: 320 + attention_resolutions: + - 4 + - 2 + - 1 + num_res_blocks: 2 + channel_mult: + - 1 + - 2 + - 4 + - 4 + num_heads: 8 + use_spatial_transformer: true + transformer_depth: 1 + context_dim: 768 + use_checkpoint: true + legacy: false + first_stage_config: + target: ldm.models.autoencoder.AutoencoderKL + params: + embed_dim: 4 + monitor: val/rec_loss + ddconfig: + double_z: true + z_channels: 4 + resolution: 512 + in_channels: 3 + out_ch: 3 + ch: 128 + ch_mult: + - 1 + - 2 + - 4 + - 4 + num_res_blocks: 2 + attn_resolutions: [] + dropout: 0.0 + lossconfig: + target: torch.nn.Identity + cond_stage_config: + target: ldm.modules.encoders.modules.FrozenCLIPEmbedder + ckpt_path: stable-diffusion-v-1-4-original/sd-v1-4-full-ema.ckpt +data: + target: main.DataModuleFromConfig + params: + batch_size: 1 + num_workers: 2 + wrap: false + train: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + per_image_tokens: false + repeats: 100 + special_token: fxg + placeholder_token: wolf plushie + reg: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: train + reg: true + per_image_tokens: false + repeats: 10 + placeholder_token: wolf plushie + validation: + target: ldm.data.personalized.PersonalizedBase + params: + size: 512 + set: val + per_image_tokens: false + repeats: 10 + placeholder_token: wolf plushie diff --git a/dreamedit_official_ckpt/wolf_plushie-fxg/images/train/conditioning_gs-000500_e-000001_b-000020.jpg b/dreamedit_official_ckpt/wolf_plushie-fxg/images/train/conditioning_gs-000500_e-000001_b-000020.jpg new file mode 100755 index 0000000000000000000000000000000000000000..615e9beb573442a18863723fec80724e6eab0b68 Binary files /dev/null and b/dreamedit_official_ckpt/wolf_plushie-fxg/images/train/conditioning_gs-000500_e-000001_b-000020.jpg differ diff --git a/dreamedit_official_ckpt/wolf_plushie-fxg/images/train/inputs_gs-000500_e-000001_b-000020.jpg b/dreamedit_official_ckpt/wolf_plushie-fxg/images/train/inputs_gs-000500_e-000001_b-000020.jpg new file mode 100755 index 0000000000000000000000000000000000000000..cb72b994b4c9849a007cc320e1eee7b37c314512 Binary files /dev/null and b/dreamedit_official_ckpt/wolf_plushie-fxg/images/train/inputs_gs-000500_e-000001_b-000020.jpg differ diff --git a/dreamedit_official_ckpt/wolf_plushie-fxg/images/train/reconstruction_gs-000500_e-000001_b-000020.jpg b/dreamedit_official_ckpt/wolf_plushie-fxg/images/train/reconstruction_gs-000500_e-000001_b-000020.jpg new file mode 100755 index 0000000000000000000000000000000000000000..9fee2c25d7514465c5850bef984381090890af73 Binary files /dev/null and b/dreamedit_official_ckpt/wolf_plushie-fxg/images/train/reconstruction_gs-000500_e-000001_b-000020.jpg differ diff --git a/dreamedit_official_ckpt/wolf_plushie-fxg/images/train/samples_gs-000500_e-000001_b-000020.jpg b/dreamedit_official_ckpt/wolf_plushie-fxg/images/train/samples_gs-000500_e-000001_b-000020.jpg new file mode 100755 index 0000000000000000000000000000000000000000..7d929caf8cbe54dac8f6bc291b78ce000bb57e10 Binary files /dev/null and b/dreamedit_official_ckpt/wolf_plushie-fxg/images/train/samples_gs-000500_e-000001_b-000020.jpg differ diff --git a/dreamedit_official_ckpt/wolf_plushie-fxg/images/train/samples_scaled_gs-000500_e-000001_b-000020.jpg b/dreamedit_official_ckpt/wolf_plushie-fxg/images/train/samples_scaled_gs-000500_e-000001_b-000020.jpg new file mode 100755 index 0000000000000000000000000000000000000000..c6659abb5378eec56ecb0b284137fca527eb3aa9 Binary files /dev/null and b/dreamedit_official_ckpt/wolf_plushie-fxg/images/train/samples_scaled_gs-000500_e-000001_b-000020.jpg differ