isaaccorley
committed on
Commit
•
8f23d47
1
Parent(s):
e75d762
Upload 4 files
Browse files
- swin-v2-rgb/config.json +221 -0
- swin-v2-rgb/config.yaml +37 -0
- swin-v2-rgb/log_rank0.txt +0 -0
- swin-v2-rgb/log_rank1.txt +0 -0
swin-v2-rgb/config.json
ADDED
@@ -0,0 +1,221 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
AMP_ENABLE: true
|
2 |
+
AMP_OPT_LEVEL: ''
|
3 |
+
AUG:
|
4 |
+
AUTO_AUGMENT: rand-m9-mstd0.5-inc1
|
5 |
+
COLOR_JITTER: 0.4
|
6 |
+
CUTMIX: 1.0
|
7 |
+
CUTMIX_MINMAX: null
|
8 |
+
MIXUP: 0.8
|
9 |
+
MIXUP_MODE: batch
|
10 |
+
MIXUP_PROB: 1.0
|
11 |
+
MIXUP_SWITCH_PROB: 0.5
|
12 |
+
RECOUNT: 1
|
13 |
+
REMODE: pixel
|
14 |
+
REPROB: 0.25
|
15 |
+
BASE:
|
16 |
+
- ''
|
17 |
+
DATA:
|
18 |
+
BANDS: rgb
|
19 |
+
BATCH_SIZE: 64
|
20 |
+
CACHE_MODE: part
|
21 |
+
CHANNELS: 3
|
22 |
+
DATASET: imagenet
|
23 |
+
DATA_PATH: /workspace/storage/data/hydro/images/
|
24 |
+
IMG_SIZE: 256
|
25 |
+
INTERPOLATION: bicubic
|
26 |
+
MASK_PATCH_SIZE: 32
|
27 |
+
MASK_RATIO: 0.6
|
28 |
+
MEAN:
|
29 |
+
- 340.76769064
|
30 |
+
- 429.9430203
|
31 |
+
- 614.21682446
|
32 |
+
- 590.23569706
|
33 |
+
- 950.68368468
|
34 |
+
- 1792.46290469
|
35 |
+
- 2075.46795189
|
36 |
+
- 2218.94553375
|
37 |
+
- 2266.46036911
|
38 |
+
- 2246.0605464
|
39 |
+
- 1594.42694882
|
40 |
+
- 1009.32729131
|
41 |
+
NUM_WORKERS: 8
|
42 |
+
PIN_MEMORY: true
|
43 |
+
STD:
|
44 |
+
- 554.81258967
|
45 |
+
- 572.41639287
|
46 |
+
- 582.87945694
|
47 |
+
- 675.88746967
|
48 |
+
- 729.89827633
|
49 |
+
- 1096.01480586
|
50 |
+
- 1273.45393088
|
51 |
+
- 1365.45589904
|
52 |
+
- 1356.13789355
|
53 |
+
- 1302.3292881
|
54 |
+
- 1079.19066363
|
55 |
+
- 818.86747235
|
56 |
+
ZIP_MODE: false
|
57 |
+
ENABLE_AMP: true
|
58 |
+
EVAL_MODE: false
|
59 |
+
FUSED_LAYERNORM: false
|
60 |
+
FUSED_WINDOW_PROCESS: false
|
61 |
+
LOCAL_RANK: 0
|
62 |
+
MODEL:
|
63 |
+
DROP_PATH_RATE: 0.1
|
64 |
+
DROP_RATE: 0.0
|
65 |
+
IN_CHANS: 3
|
66 |
+
LABEL_SMOOTHING: 0.1
|
67 |
+
NAME: hydro_rgb_simmim_pretrain
|
68 |
+
NUM_CLASSES: 1000
|
69 |
+
PRETRAINED: ''
|
70 |
+
RESUME: ''
|
71 |
+
SIMMIM:
|
72 |
+
NORM_TARGET:
|
73 |
+
ENABLE: true
|
74 |
+
PATCH_SIZE: 47
|
75 |
+
SWIN:
|
76 |
+
APE: false
|
77 |
+
DEPTHS:
|
78 |
+
- 2
|
79 |
+
- 2
|
80 |
+
- 6
|
81 |
+
- 2
|
82 |
+
EMBED_DIM: 96
|
83 |
+
IN_CHANS: 3
|
84 |
+
MLP_RATIO: 4.0
|
85 |
+
NUM_HEADS:
|
86 |
+
- 3
|
87 |
+
- 6
|
88 |
+
- 12
|
89 |
+
- 24
|
90 |
+
PATCH_NORM: true
|
91 |
+
PATCH_SIZE: 4
|
92 |
+
QKV_BIAS: true
|
93 |
+
QK_SCALE: null
|
94 |
+
WINDOW_SIZE: 7
|
95 |
+
SWINV2:
|
96 |
+
APE: false
|
97 |
+
DEPTHS:
|
98 |
+
- 2
|
99 |
+
- 2
|
100 |
+
- 18
|
101 |
+
- 2
|
102 |
+
EMBED_DIM: 128
|
103 |
+
IN_CHANS: 3
|
104 |
+
MLP_RATIO: 4.0
|
105 |
+
NUM_HEADS:
|
106 |
+
- 4
|
107 |
+
- 8
|
108 |
+
- 16
|
109 |
+
- 32
|
110 |
+
PATCH_NORM: true
|
111 |
+
PATCH_SIZE: 4
|
112 |
+
PRETRAINED_WINDOW_SIZES:
|
113 |
+
- 0
|
114 |
+
- 0
|
115 |
+
- 0
|
116 |
+
- 0
|
117 |
+
QKV_BIAS: true
|
118 |
+
WINDOW_SIZE: 16
|
119 |
+
SWIN_MLP:
|
120 |
+
APE: false
|
121 |
+
DEPTHS:
|
122 |
+
- 2
|
123 |
+
- 2
|
124 |
+
- 6
|
125 |
+
- 2
|
126 |
+
EMBED_DIM: 96
|
127 |
+
IN_CHANS: 3
|
128 |
+
MLP_RATIO: 4.0
|
129 |
+
NUM_HEADS:
|
130 |
+
- 3
|
131 |
+
- 6
|
132 |
+
- 12
|
133 |
+
- 24
|
134 |
+
PATCH_NORM: true
|
135 |
+
PATCH_SIZE: 4
|
136 |
+
WINDOW_SIZE: 7
|
137 |
+
SWIN_MOE:
|
138 |
+
APE: false
|
139 |
+
AUX_LOSS_WEIGHT: 0.01
|
140 |
+
CAPACITY_FACTOR: 1.25
|
141 |
+
COSINE_ROUTER: false
|
142 |
+
COSINE_ROUTER_DIM: 256
|
143 |
+
COSINE_ROUTER_INIT_T: 0.5
|
144 |
+
DEPTHS:
|
145 |
+
- 2
|
146 |
+
- 2
|
147 |
+
- 6
|
148 |
+
- 2
|
149 |
+
EMBED_DIM: 96
|
150 |
+
GATE_NOISE: 1.0
|
151 |
+
INIT_STD: 0.02
|
152 |
+
IN_CHANS: 3
|
153 |
+
IS_GSHARD_LOSS: false
|
154 |
+
MLP_FC2_BIAS: true
|
155 |
+
MLP_RATIO: 4.0
|
156 |
+
MOE_BLOCKS:
|
157 |
+
- - -1
|
158 |
+
- - -1
|
159 |
+
- - -1
|
160 |
+
- - -1
|
161 |
+
MOE_DROP: 0.0
|
162 |
+
NORMALIZE_GATE: false
|
163 |
+
NUM_HEADS:
|
164 |
+
- 3
|
165 |
+
- 6
|
166 |
+
- 12
|
167 |
+
- 24
|
168 |
+
NUM_LOCAL_EXPERTS: 1
|
169 |
+
PATCH_NORM: true
|
170 |
+
PATCH_SIZE: 4
|
171 |
+
PRETRAINED_WINDOW_SIZES:
|
172 |
+
- 0
|
173 |
+
- 0
|
174 |
+
- 0
|
175 |
+
- 0
|
176 |
+
QKV_BIAS: true
|
177 |
+
QK_SCALE: null
|
178 |
+
TOP_VALUE: 1
|
179 |
+
USE_BPR: true
|
180 |
+
WINDOW_SIZE: 7
|
181 |
+
TYPE: swinv2
|
182 |
+
OUTPUT: output/hydro_rgb_simmim_pretrain/hydro_rgb_simmim_pretrain_swinv2_base_img256_window16_800ep
|
183 |
+
PRINT_FREQ: 100
|
184 |
+
SAVE_FREQ: 5
|
185 |
+
SEED: 0
|
186 |
+
TAG: hydro_rgb_simmim_pretrain_swinv2_base_img256_window16_800ep
|
187 |
+
TEST:
|
188 |
+
CROP: true
|
189 |
+
SEQUENTIAL: false
|
190 |
+
SHUFFLE: false
|
191 |
+
THROUGHPUT_MODE: false
|
192 |
+
TRAIN:
|
193 |
+
ACCUMULATION_STEPS: 1
|
194 |
+
AUTO_RESUME: true
|
195 |
+
BASE_LR: 2.5e-05
|
196 |
+
CLIP_GRAD: 5.0
|
197 |
+
EPOCHS: 800
|
198 |
+
LAYER_DECAY: 1.0
|
199 |
+
LR_SCHEDULER:
|
200 |
+
DECAY_EPOCHS: 30
|
201 |
+
DECAY_RATE: 0.1
|
202 |
+
GAMMA: 0.1
|
203 |
+
MULTISTEPS:
|
204 |
+
- 700
|
205 |
+
NAME: multistep
|
206 |
+
WARMUP_PREFIX: true
|
207 |
+
MIN_LR: 1.25e-06
|
208 |
+
MOE:
|
209 |
+
SAVE_MASTER: false
|
210 |
+
OPTIMIZER:
|
211 |
+
BETAS:
|
212 |
+
- 0.9
|
213 |
+
- 0.999
|
214 |
+
EPS: 1.0e-08
|
215 |
+
MOMENTUM: 0.9
|
216 |
+
NAME: adamw
|
217 |
+
START_EPOCH: 0
|
218 |
+
USE_CHECKPOINT: false
|
219 |
+
WARMUP_EPOCHS: 10
|
220 |
+
WARMUP_LR: 1.25e-07
|
221 |
+
WEIGHT_DECAY: 0.05
|
swin-v2-rgb/config.yaml
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
MODEL:
|
2 |
+
TYPE: swinv2
|
3 |
+
NAME: hydro_rgb_simmim_pretrain
|
4 |
+
PRETRAINED: checkpoints/swin-v2-rgb/ckpt_epoch_799.pth
|
5 |
+
DROP_PATH_RATE: 0.1
|
6 |
+
SIMMIM:
|
7 |
+
NORM_TARGET:
|
8 |
+
ENABLE: True
|
9 |
+
PATCH_SIZE: 47
|
10 |
+
SWINV2:
|
11 |
+
EMBED_DIM: 128
|
12 |
+
DEPTHS: [ 2, 2, 18, 2 ]
|
13 |
+
NUM_HEADS: [ 4, 8, 16, 32 ]
|
14 |
+
WINDOW_SIZE: 16
|
15 |
+
IN_CHANS: 3
|
16 |
+
DATA:
|
17 |
+
DATA_PATH: /workspace/storage/data/hydro/images/
|
18 |
+
BANDS: rgb
|
19 |
+
CHANNELS: 3
|
20 |
+
IMG_SIZE: 256
|
21 |
+
MASK_PATCH_SIZE: 32
|
22 |
+
MASK_RATIO: 0.6
|
23 |
+
MEAN: [340.76769064, 429.9430203, 614.21682446, 590.23569706, 950.68368468, 1792.46290469, 2075.46795189, 2218.94553375, 2266.46036911, 2246.0605464, 1594.42694882, 1009.32729131]
|
24 |
+
STD: [554.81258967, 572.41639287, 582.87945694, 675.88746967, 729.89827633, 1096.01480586, 1273.45393088, 1365.45589904, 1356.13789355, 1302.3292881, 1079.19066363, 818.86747235]
|
25 |
+
TRAIN:
|
26 |
+
EPOCHS: 800
|
27 |
+
WARMUP_EPOCHS: 10
|
28 |
+
BASE_LR: 1e-4
|
29 |
+
WARMUP_LR: 5e-7
|
30 |
+
WEIGHT_DECAY: 0.05
|
31 |
+
LR_SCHEDULER:
|
32 |
+
NAME: 'multistep'
|
33 |
+
GAMMA: 0.1
|
34 |
+
MULTISTEPS: [700,]
|
35 |
+
PRINT_FREQ: 100
|
36 |
+
SAVE_FREQ: 5
|
37 |
+
TAG: hydro_rgb_simmim_pretrain_swinv2_base_img256_window16_800ep
|
swin-v2-rgb/log_rank0.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
swin-v2-rgb/log_rank1.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|