Upload decoder_config.json with huggingface_hub
Browse files
- decoder_config.json +10 -9
decoder_config.json
CHANGED
@@ -56,8 +56,8 @@
|
|
56 |
},
|
57 |
"train": {
|
58 |
"epochs": 1000,
|
59 |
-
"lr":
|
60 |
-
"wd": 0.
|
61 |
"max_grad_norm": 0.5,
|
62 |
"save_every_n_samples": 200000,
|
63 |
"n_sample_images": 10,
|
@@ -65,8 +65,7 @@
|
|
65 |
"epoch_samples": 2000000,
|
66 |
"validation_samples": 100000,
|
67 |
"use_ema": true,
|
68 |
-
"ema_beta": 0.
|
69 |
-
"ema_inv_gamma":0.75,
|
70 |
"save_all": false,
|
71 |
"save_latest": true,
|
72 |
"save_best": true,
|
@@ -92,11 +91,15 @@
|
|
92 |
"wandb_entity": "nousr_laion",
|
93 |
"wandb_project": "dalle2_train_decoder",
|
94 |
|
|
|
|
|
|
|
95 |
"verbose": true
|
96 |
},
|
97 |
|
98 |
"load": {
|
99 |
-
"load_from":
|
|
|
100 |
},
|
101 |
|
102 |
"save": [{
|
@@ -106,10 +109,8 @@
|
|
106 |
"save_to": "huggingface",
|
107 |
"huggingface_repo": "laion/DALLE2-PyTorch",
|
108 |
|
109 |
-
"
|
110 |
-
|
111 |
-
"save_best": true,
|
112 |
-
|
113 |
"save_type": "model"
|
114 |
}]
|
115 |
}
|
|
|
56 |
},
|
57 |
"train": {
|
58 |
"epochs": 1000,
|
59 |
+
"lr":1e-4,
|
60 |
+
"wd": 0.01,
|
61 |
"max_grad_norm": 0.5,
|
62 |
"save_every_n_samples": 200000,
|
63 |
"n_sample_images": 10,
|
|
|
65 |
"epoch_samples": 2000000,
|
66 |
"validation_samples": 100000,
|
67 |
"use_ema": true,
|
68 |
+
"ema_beta": 0.99,
|
|
|
69 |
"save_all": false,
|
70 |
"save_latest": true,
|
71 |
"save_best": true,
|
|
|
91 |
"wandb_entity": "nousr_laion",
|
92 |
"wandb_project": "dalle2_train_decoder",
|
93 |
|
94 |
+
"wandb_run_id": "5ojoz4bw",
|
95 |
+
"wandb_resume": true,
|
96 |
+
|
97 |
"verbose": true
|
98 |
},
|
99 |
|
100 |
"load": {
|
101 |
+
"load_from": "wandb",
|
102 |
+
"wandb_file_path": "latest.pth"
|
103 |
},
|
104 |
|
105 |
"save": [{
|
|
|
109 |
"save_to": "huggingface",
|
110 |
"huggingface_repo": "laion/DALLE2-PyTorch",
|
111 |
|
112 |
+
"save_latest_to": "latest_{epoch}.pth",
|
113 |
+
|
|
|
|
|
114 |
"save_type": "model"
|
115 |
}]
|
116 |
}
|