laion
/

DALLE2-PyTorch

Model card · Files and versions · Community

rom1504 committed on Jul 4, 2022

Commit

249b307

1 Parent(s): 9df49c1

Update decoder_config.json

Browse files

Files changed (1) hide show

decoder_config.json +13 -13

decoder_config.json CHANGED Viewed

@@ -4,7 +4,7 @@
     "decoder": {
         "unets": [
             {
-                "dim": 256,
                 "cond_dim": 512,
                 "image_embed_dim": 768,
                 "text_embed_dim": 768,
@@ -15,8 +15,7 @@
                 "attn_heads": 8,
                 "attn_dim_head": 64,
                 "sparse_attn": true,
-                "memory_efficient": true,
-		        "self_attn": [false, true, true, true]
             }
         ],
         "clip": {
@@ -34,7 +33,7 @@
         "webdataset_base_url": "pipe:aws s3 cp --quiet s3://s-datasets/laion-aesthetic/data/laion2B-en-aesthetic/{}.tar -",
         "embeddings_url": "s3://s-datasets/laion-aesthetic/ordered_embeddings/",
         "num_workers": 12,
-        "batch_size": 60,
         "start_shard": 0,
         "end_shard": 5247,
         "shard_width": 5,
@@ -60,10 +59,10 @@
         "lr":1e-4,
         "wd": 0.01,
         "max_grad_norm": 0.5,
-        "save_every_n_samples": 2000000,
         "n_sample_images": 10,
         "device": "cuda:0",
-        "epoch_samples": 40000000,
         "validation_samples": 100000,
         "use_ema": true,
         "ema_beta": 0.99,
@@ -89,17 +88,19 @@
         "log": {
             "log_type": "wandb",
-            "wandb_entity": "rom1504",
             "wandb_project": "dalle2_train_decoder",
-            "wandb_resume": false,
             "verbose": true
         },
         "load": {
-	    "resume": true,
             "load_from": "url",
-            "url": "https://api.wandb.ai/files/rom1504/dalle2_train_decoder/3tmnv289/latest.pth"
         },
         "save": [{
@@ -109,10 +110,9 @@
             "save_to": "huggingface",
             "huggingface_repo": "laion/DALLE2-PyTorch",
-            "save_latest_to": "decoder/small_32gpus/latest.pth",
             "save_type": "model"
         }]
     }
-}

     "decoder": {
         "unets": [
             {
+                "dim": 416,
                 "cond_dim": 512,
                 "image_embed_dim": 768,
                 "text_embed_dim": 768,
                 "attn_heads": 8,
                 "attn_dim_head": 64,
                 "sparse_attn": true,
+                "memory_efficient": true
             }
         ],
         "clip": {
         "webdataset_base_url": "pipe:aws s3 cp --quiet s3://s-datasets/laion-aesthetic/data/laion2B-en-aesthetic/{}.tar -",
         "embeddings_url": "s3://s-datasets/laion-aesthetic/ordered_embeddings/",
         "num_workers": 12,
+        "batch_size": 21,
         "start_shard": 0,
         "end_shard": 5247,
         "shard_width": 5,
         "lr":1e-4,
         "wd": 0.01,
         "max_grad_norm": 0.5,
+        "save_every_n_samples": 200000,
         "n_sample_images": 10,
         "device": "cuda:0",
+        "epoch_samples": 2000000,
         "validation_samples": 100000,
         "use_ema": true,
         "ema_beta": 0.99,
         "log": {
             "log_type": "wandb",
+            "wandb_entity": "nousr_laion",
             "wandb_project": "dalle2_train_decoder",
+            "wandb_run_id": "5ojoz4bw",
+            "wandb_resume": true,
             "verbose": true
         },
         "load": {
             "load_from": "url",
+            "url": "https://huggingface.co/Veldrovive/test_model/resolve/main/eu_latest_checkpoint2.pth"
         },
         "save": [{
             "save_to": "huggingface",
             "huggingface_repo": "laion/DALLE2-PyTorch",
+            "save_latest_to": "latest_{epoch}.pth",
             "save_type": "model"
         }]
     }
+}